Article(id=1204385487667568928, tenantId=1146029695717560320, journalId=1189621681917173762, issueId=1204385484878356718, articleNumber=null, orderNo=null, doi=10.19620/j.cnki.1000-3703.20220500, pmid=null, cstr=null, oa=null, hot=null, price=null, onlineType=0, articleFormat=0, articleType=null, articleTypeStr=research-article, receivedDate=null, receivedDateStr=null, revisedDate=1657814400000, revisedDateStr=2022-07-15, acceptedDate=null, acceptedDateStr=null, onlineDate=1765077476659, onlineDateStr=2025-12-07, pubDate=1679587200000, pubDateStr=2023-03-24, doiRegisterDate=null, doiRegisterDateStr=null, onlineIssueDate=1765077476659, onlineIssueDateStr=2025-12-07, onlineJustAcceptDate=null, onlineJustAcceptDateStr=null, onlineFirstDate=null, onlineFirstDateStr=null, sourceXml=null, magXml=null, createTime=1765077476659, creator=13701087609, updateTime=1765077476659, updator=13701087609, issue=Issue{id=1204385484878356718, tenantId=1146029695717560320, journalId=1189621681917173762, year='2023', volume='', issue='3', pageStart='1', pageEnd='62', issueExtLink='null', onlineDate='null', pubDate='null', beforeIssueId=null, nextIssueId=null, price=null, status=1, issueComplete=1, articleOrder=1, issueType=-1, specialIssue=null, createTime=1765077475995, creator=13701087609, updateTime=1765079076236, updator=13701087609, preIssue=null, nextIssue=null, ext={EN=IssueExt(id=1204392196872053307, tenantId=1146029695717560320, journalId=1189621681917173762, issueId=1204385484878356718, language=EN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=), CN=IssueExt(id=1204392196872053308, tenantId=1146029695717560320, journalId=1189621681917173762, issueId=1204385484878356718, language=CN, specialIssueTitle=, coverIllustrator=null, specialIssueEditor=, specialIssueAbout=)}, issueFiles=null}, startPage=26, endPage=34, ext={EN=ArticleExt(id=1204385487856312614, articleId=1204385487667568928, tenantId=1146029695717560320, journalId=1189621681917173762, language=EN, title=Research on Adaptive Cruise Control Based on Soft Actor-Critic Algorithm, columnId=null, journalTitle=Automobile Technology, columnName=null, runingTitle=null, highlight=null, articleAbstract=
For the problems of adaptive cruise control technology, including insufficient environmental adaptability of control algorithm for Deep Reinforcement Learning (DRL), poor model mitigation and generalization ability, this paper proposed the Soft Actor-Critic (SAC) control algorithm based on the principle of maximum entropy and stochastic off-line policy. SAC network was built to fit action value function and action policy function, and auto-adjusting temperature coefficient was used to improve the environmental exploration ability of intelligent agent. For the problem of sparse reward, the reward function was designed by using the idea of reward shaping. In addition, a new experience replay mechanism was proposed to improve the utilization rate of samples. The proposed control algorithm was simulated and tested in different scenes, and compared with Deep Deterministic Policy Gradient (DDPG). The results show that the algorithm has better model generalization ability and migration effect on real vehicles.
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=null, magXml=null, pdfUrl=null, pdf=null, pdfFileSize=null, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=null, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=null, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=Kegang Zhao, Cuiduo Shi, Zhihao Liang, Ziqi Li, Yulong Wang), CN=ArticleExt(id=1204385491589243291, articleId=1204385487667568928, tenantId=1146029695717560320, journalId=1189621681917173762, language=CN, title=基于柔性演员-评论家算法的自适应巡航控制研究
*, columnId=0, journalTitle=汽车技术, columnName=, runingTitle=null, highlight=null, articleAbstract=
针对目前自适应巡航控制技术中,深度强化学习的控制算法环境适应能力不足、模型迁移性及泛化能力较差的问题,提出一种基于最大熵原理和随机离线策略的柔性演员-评论家(SAC)控制算法。构建演员和评论家网络拟合动作值函数和动作策略函数,并使用自调节温度系数改善智能体的环境探索能力;针对奖励稀疏问题,运用奖励塑造思想设计奖励函数;此外,提出一种新的经验回放机制以提高样本利用率。将所提出的控制算法在不同场景中进行仿真及实车验证,并与深度确定性策略梯度(DDPG)算法进行比较,结果表明,该算法具有更好的模型泛化能力和实车迁移效果。
, correspAuthors=null, authorNote=null, correspAuthorsNote=null, copyrightStatement=null, copyrightOwner=null, extLink=null, articleAbsUrl=null, sourceXml=37m9qQ/tW57jgL15fSBaGw==, magXml=hdBXumX+2wi9YunExe5IuA==, pdfUrl=null, pdf=l8Ht+SQNKa2D1Ck5VKw4uw==, pdfFileSize=2095749, pdfExtLink=null, richHtmlUrl=null, mobilePdfUrl=null, reviewReport=null, pdfFirstPage=null, abstractGraph=/U3VQOExIpQAKN9feLGDSg==, abstractGraphContent=null, abstractVideo=null, citation=null, cebUrl=null, magXmlContent=ArG+YgXqyNdP9rds5d9m2g==, mapNumber=null, authorCompany=null, fund=null, authors=null, authorsList=赵克刚, 石翠铎, 梁志豪, 李梓棋, 王玉龙)}, authors=[Author(id=1204452610616042496, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, orderNo=0, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1204452610800590868, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452610616042496, language=EN, stringName=Kegang Zhao, firstName=Kegang, middleName=null, lastName=Zhao, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 South China University of Technology, Guangzhou 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1204452610901254178, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452610616042496, language=CN, stringName=赵克刚, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 华南理工大学,广州 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1204452610192417745, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=1, ext=[AuthorCompanyExt(id=1204452610209194965, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 South China University of Technology, Guangzhou 510641), AuthorCompanyExt(id=1204452610217583574, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华南理工大学,广州 510641)])]), Author(id=1204452611043860530, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, orderNo=1, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1204452611295518790, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611043860530, language=EN, stringName=Cuiduo Shi, firstName=Cuiduo, middleName=null, lastName=Shi, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 South China University of Technology, Guangzhou 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1204452611391987793, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611043860530, language=CN, stringName=石翠铎, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 华南理工大学,广州 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1204452610192417745, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=1, ext=[AuthorCompanyExt(id=1204452610209194965, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 South China University of Technology, Guangzhou 510641), AuthorCompanyExt(id=1204452610217583574, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华南理工大学,广州 510641)])]), Author(id=1204452611467485282, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, orderNo=2, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1204452611584925808, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611467485282, language=EN, stringName=Zhihao Liang, firstName=Zhihao, middleName=null, lastName=Liang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 South China University of Technology, Guangzhou 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1204452611681394814, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611467485282, language=CN, stringName=梁志豪, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 华南理工大学,广州 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1204452610192417745, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=1, ext=[AuthorCompanyExt(id=1204452610209194965, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 South China University of Technology, Guangzhou 510641), AuthorCompanyExt(id=1204452610217583574, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华南理工大学,广州 510641)])]), Author(id=1204452611811418260, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, orderNo=3, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1204452611916275873, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611811418260, language=EN, stringName=Ziqi Li, firstName=Ziqi, middleName=null, lastName=Li, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 South China University of Technology, Guangzhou 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1204452612033716403, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452611811418260, language=CN, stringName=李梓棋, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
1, address=
1 华南理工大学,广州 510641, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1204452610192417745, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=1, ext=[AuthorCompanyExt(id=1204452610209194965, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 South China University of Technology, Guangzhou 510641), AuthorCompanyExt(id=1204452610217583574, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华南理工大学,广州 510641)])]), Author(id=1204452612142768319, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, orderNo=4, firstName=null, middleName=null, lastName=null, nameCn=null, orcid=null, stid=null, country=null, authorPic=null, dead=0, email=null, emailSecond=null, emailThird=null, correspondingAuthor=0, authorType=1, ext={EN=AuthorExt(id=1204452612297957585, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452612142768319, language=EN, stringName=Yulong Wang, firstName=Yulong, middleName=null, lastName=Wang, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2 State Key Laboratory of Advanced Design and Manufacturing for Vehicle Body, Hunan University, Changsha 410082, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null), CN=AuthorExt(id=1204452612440563938, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, authorId=1204452612142768319, language=CN, stringName=王玉龙, firstName=null, middleName=null, lastName=null, prefix=null, suffix=null, authorComment=null, nameInitials=null, affiliation=null, department=null, xref=
2, address=
2 湖南大学,汽车车身先进设计制造国家重点实验室,长沙 410082, bio=null, bioImg=null, bioContent=null, aboutCorrespAuthor=null)}, companyList=[AuthorCompany(id=1204452610393744363, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=2, ext=[AuthorCompanyExt(id=1204452610414715887, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610393744363, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 State Key Laboratory of Advanced Design and Manufacturing for Vehicle Body, Hunan University, Changsha 410082), AuthorCompanyExt(id=1204452610439881712, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610393744363, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 湖南大学,汽车车身先进设计制造国家重点实验室,长沙 410082)])])], keywords=[Keyword(id=1204452612708999422, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, orderNo=1, keyword=Adaptive cruise control), Keyword(id=1204452612797079817, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, orderNo=2, keyword=Soft Actor-Critic(SAC)), Keyword(id=1204452612927103257, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, orderNo=3, keyword=Mitigation), Keyword(id=1204452613073903916, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, orderNo=4, keyword=Deep Reinforcement Learning(DRL)), Keyword(id=1204452613166178620, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, orderNo=1, keyword=自适应巡航控制), Keyword(id=1204452613266841930, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, orderNo=2, keyword=柔性演员-评论家), Keyword(id=1204452613455585632, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, orderNo=3, keyword=可迁移性), Keyword(id=1204452613593997681, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, orderNo=4, keyword=深度强化学习)], refs=[Reference(id=1204452618883015558, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2018, volume=45, issue=null, pageStart=18, pageEnd=40, url=null, language=null, rfNumber=[1], rfOrder=0, authorNames=GUANETTI J, KIM Y, BORRELLI F, journalName=Annual Reviews in Control, refType=null, unstructuredReference=
GUANETTI J,
KIM Y,
BORRELLI F. Control of Connected and Automated Vehicles: State of the Art and Future Challenges[J].
Annual Reviews in Control,
2018,
45: 18-40., articleTitle=Control of Connected and Automated Vehicles: State of the Art and Future Challenges, refAbstract=null), Reference(id=1204452619059176337, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2017, volume=45, issue=4, pageStart=544, pageEnd=553, url=null, language=null, rfNumber=[2], rfOrder=1, authorNames=吴光强, 张亮修, 刘兆勇, journalName=同济大学学报(自然科学版), refType=null, unstructuredReference=吴光强, 张亮修, 刘兆勇, 等. 汽车自适应巡航控制系统研究现状与发展趋势[J].
同济大学学报(自然科学版),
2017,
45(4): 544-553., articleTitle=汽车自适应巡航控制系统研究现状与发展趋势, refAbstract=null), Reference(id=1204452619205976984, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2017, volume=45, issue=4, pageStart=544, pageEnd=553, url=null, language=null, rfNumber=[2], rfOrder=2, authorNames=WU G Q, ZHANG L X, LIU Z Y, journalName=Journal of Tongji University (Natural Science), refType=null, unstructuredReference=
WU G Q,
ZHANG L X,
LIU Z Y, et al. Research Status and Development Trend of Vehicle Adaptive Cruise Control Systems[J].
Journal of Tongji University (Natural Science),
2017,
45(4): 544-553., articleTitle=Research Status and Development Trend of Vehicle Adaptive Cruise Control Systems, refAbstract=null), Reference(id=1204452619356971943, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2015, volume=518, issue=null, pageStart=529, pageEnd=533, url=null, language=null, rfNumber=[3], rfOrder=3, authorNames=MNIH V, KAVUKCUOGLU K, SILVER D, journalName=Nature, refType=null, unstructuredReference=
MNIH V,
KAVUKCUOGLU K,
SILVER D, et al. Human-Level Control Through Deep Reinforcement Learning[J].
Nature,
2015,
518: 529-533., articleTitle=Human-Level Control Through Deep Reinforcement Learning, refAbstract=null), Reference(id=1204452619533132723, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2016, volume=33, issue=6, pageStart=701, pageEnd=717, url=null, language=null, rfNumber=[4], rfOrder=4, authorNames=赵冬斌, 邵坤, 朱圆恒, journalName=控制理论与应用, refType=null, unstructuredReference=赵冬斌, 邵坤, 朱圆恒, 等. 深度强化学习综述:兼论计算机围棋的发展[J].
控制理论与应用,
2016,
33(6): 701-717., articleTitle=深度强化学习综述:兼论计算机围棋的发展, refAbstract=null), Reference(id=1204452619650573240, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2016, volume=33, issue=6, pageStart=701, pageEnd=717, url=null, language=null, rfNumber=[4], rfOrder=5, authorNames=ZHAO D B, SHAO K, ZHU Y H, journalName=Control Theory & Applications, refType=null, unstructuredReference=
ZHAO D B,
SHAO K,
ZHU Y H, et al. Review of Deep Reinforcement Learning and Discussions on the Development of Computer Go[J].
Control Theory & Applications,
2016,
33(6): 701-717., articleTitle=Review of Deep Reinforcement Learning and Discussions on the Development of Computer Go, refAbstract=null), Reference(id=1204452619784790980, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2018, volume=41, issue=1, pageStart=1, pageEnd=27, url=null, language=null, rfNumber=[5], rfOrder=6, authorNames=刘全, 翟建伟, 章宗长, journalName=计算机学报, refType=null, unstructuredReference=刘全, 翟建伟, 章宗长, 等. 深度强化学习综述[J].
计算机学报,
2018,
41(1): 1-27., articleTitle=深度强化学习综述, refAbstract=null), Reference(id=1204452619923203026, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2018, volume=41, issue=1, pageStart=1, pageEnd=27, url=null, language=null, rfNumber=[5], rfOrder=7, authorNames=LIU Q, ZHAI J W, ZHANG Z Z, journalName=Chinese Journal of Computers, refType=null, unstructuredReference=
LIU Q,
ZHAI J W,
ZHANG Z Z, et al. A Survey on Deep Reinforcement Learning[J].
Chinese Journal of Computers,
2018,
41(1): 1-27., articleTitle=A Survey on Deep Reinforcement Learning, refAbstract=null), Reference(id=1204452620011283422, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2018, volume=114, issue=null, pageStart=1, pageEnd=18, url=null, language=null, rfNumber=[6], rfOrder=8, authorNames=YOU C X, LU J B, FILEV D, journalName=Robotics and Autonomous Systems, refType=null, unstructuredReference=
YOU C X,
LU J B,
FILEV D, et al. Advanced Planning for Autonomous Vehicles Using Reinforcement Learning and Deep Inverse Reinforcement Learning[J].
Robotics and Autonomous Systems,
2018,
114: 1-18., articleTitle=Advanced Planning for Autonomous Vehicles Using Reinforcement Learning and Deep Inverse Reinforcement Learning, refAbstract=null), Reference(id=1204452620158084076, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2019, volume=7, issue=null, pageStart=165262, pageEnd=165278, url=null, language=null, rfNumber=[7], rfOrder=9, authorNames=ZHOU X Y, WU P, ZHANG H F, journalName=IEEE Access, refType=null, unstructuredReference=
ZHOU X Y,
WU P,
ZHANG H F, et al. Learn to Navigate: Cooperative Path Planning for Unmanned Surface Vehicles Using Deep Reinforcement Learning[J].
IEEE Access,
2019,
7: 165262-165278., articleTitle=Learn to Navigate: Cooperative Path Planning for Unmanned Surface Vehicles Using Deep Reinforcement Learning, refAbstract=null), Reference(id=1204452620279718907, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=94, pageEnd=null, url=null, language=null, rfNumber=[8], rfOrder=10, authorNames=WASALA A, BYRNE D, MIESBAUER P, journalName=Engineering Applications of Artificial Intelligence, refType=null, unstructuredReference=
WASALA A,
BYRNE D,
MIESBAUER P, et al. Trajectory Based Lateral Control: A Reinforcement Learning Case Study[J].
Engineering Applications of Artificial Intelligence,
2020, 94., articleTitle=Trajectory Based Lateral Control: A Reinforcement Learning Case Study, refAbstract=null), Reference(id=1204452620531376136, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=332, pageEnd=337, url=null, language=null, rfNumber=[9], rfOrder=11, authorNames=FEHÉR Á, ARADI S, BÉCSI T, journalName=null, refType=null, unstructuredReference=
FEHÉR Á,
ARADI S,
BÉCSI T, et al. Proving Ground Test of a DDPG-Based Vehicle Trajectory Planner[C]// 2020 European Control Conference (ECC). St. Petersburg: IEEE,
2020: 332-337., articleTitle=null, refAbstract=null), Reference(id=1204452620669788178, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2019, volume=21, issue=11, pageStart=4895, pageEnd=4905, url=null, language=null, rfNumber=[10], rfOrder=12, authorNames=LI G Q, GӦRGES D, journalName=IEEE Transactions on Intelligent Transportation Systems, refType=null, unstructuredReference=
LI G Q,
GӦRGES D. Ecological Adaptive Cruise Control for Vehicles with Step-Gear Transmission Based on Reinforcement Learning[J].
IEEE Transactions on Intelligent Transportation Systems,
2019,
21(11): 4895-4905., articleTitle=Ecological Adaptive Cruise Control for Vehicles with Step-Gear Transmission Based on Reinforcement Learning, refAbstract=null), Reference(id=1204452620871114796, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2019, volume=20, issue=10, pageStart=3796, pageEnd=3805, url=null, language=null, rfNumber=[11], rfOrder=13, authorNames=GAO W N, GAO J Q, OZBAY K, journalName=IEEE Transactions on Intelligent Transportation Systems, refType=null, unstructuredReference=
GAO W N,
GAO J Q,
OZBAY K, et al. Reinforcement- Learning-Based Cooperative Adaptive Cruise Control of Buses in the Lincoln Tunnel Corridor with Time-Varying Topology[J].
IEEE Transactions on Intelligent Transportation Systems,
2019,
20(10): 3796-3805., articleTitle=Reinforcement- Learning-Based Cooperative Adaptive Cruise Control of Buses in the Lincoln Tunnel Corridor with Time-Varying Topology, refAbstract=null), Reference(id=1204452620980166711, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2020, volume=69, issue=6, pageStart=5876, pageEnd=5888, url=null, language=null, rfNumber=[12], rfOrder=14, authorNames=FU Y C, LI C L, YU R, journalName=IEEE Transactions on Vehicular Technology, refType=null, unstructuredReference=
FU Y C,
LI C L,
YU R, et al. A Decision-Making Strategy for Vehicle Autonomous Braking in Emergency via Deep Reinforcement Learning[J].
IEEE Transactions on Vehicular Technology,
2020,
69(6): 5876-5888., articleTitle=A Decision-Making Strategy for Vehicle Autonomous Braking in Emergency via Deep Reinforcement Learning, refAbstract=null), Reference(id=1204452621105995837, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2019, volume=8, issue=12, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[13], rfOrder=15, authorNames=QIAN L L, XU X, ZENG Y J, Deep, journalName=Electronics, refType=null, unstructuredReference=
QIAN L L,
XU X,
ZENG Y J, et al. Deep, Consistent Behavioral Decision Making with Planning Features for Autonomous Vehicles[J].
Electronics,
2019,
8(12)., articleTitle=Consistent Behavioral Decision Making with Planning Features for Autonomous Vehicles, refAbstract=null), Reference(id=1204452621206659143, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=1, pageEnd=5, url=null, language=null, rfNumber=[14], rfOrder=16, authorNames=LIU J, ZHAO L, ZHENG K, journalName=null, refType=null, unstructuredReference=
LIU J,
ZHAO L,
ZHENG K, et al. A Distributed Driving Decision Scheme Based on Reinforcement Learning for Autonomous Driving Vehicles[C]// 2020 IEEE 91st Vehicular Technology Conference (VTC2020-Spring). Antwerp: IEEE,
2020: 1-5., articleTitle=null, refAbstract=null), Reference(id=1204452621307322451, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2020, volume=null, issue=null, pageStart=1, pageEnd=6, url=null, language=null, rfNumber=[15], rfOrder=17, authorNames=HE X K, FEI C, LIU Y L, journalName=null, refType=null, unstructuredReference=
HE X K,
FEI C,
LIU Y L, et al. Multi-Objective Longitudinal Decision-Making for Autonomous Electric Vehicle:A Entropy-Constrained Reinforcement Learning Approach[C]// 2020 IEEE 23rd International Conference on Intelligent Transportation Systems (ITSC). Rhodes: IEEE,
2020: 1-6., articleTitle=null, refAbstract=null), Reference(id=1204452621403791454, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[16], rfOrder=18, authorNames=刘骝, journalName=基于多目标决策算法和PID控制的CACC系统的优化与仿真, refType=null, unstructuredReference=刘骝.
基于多目标决策算法和PID控制的CACC系统的优化与仿真[D]. 长春: 吉林大学,
2016., articleTitle=null, refAbstract=null), Reference(id=1204452621500260458, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2016, volume=null, issue=null, pageStart=null, pageEnd=null, url=null, language=null, rfNumber=[16], rfOrder=19, authorNames=LIU L, journalName=Optimization and Simulation of CACC System Based on Multi Objective Decision Algorithm and PID Control, refType=null, unstructuredReference=
LIU L.
Optimization and Simulation of CACC System Based on Multi Objective Decision Algorithm and PID Control[D]. Changchun: Jilin University,
2016., articleTitle=null, refAbstract=null), Reference(id=1204452621630283896, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2017, volume=null, issue=null, pageStart=1352, pageEnd=1361, url=null, language=null, rfNumber=[17], rfOrder=20, authorNames=HAARNOJA T, TANG H, ABBEEL P, journalName=International Conference on Machine Learning, refType=null, unstructuredReference=
HAARNOJA T,
TANG H,
ABBEEL P, et al. Reinforcement Learning with Deep Energy-Based Policies[C]//
International Conference on Machine Learning. Sydney: PMLR,
2017: 1352-1361., articleTitle=Reinforcement Learning with Deep Energy-Based Policies, refAbstract=null), Reference(id=1204452621764501638, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2018, volume=null, issue=null, pageStart=1861, pageEnd=1870, url=null, language=null, rfNumber=[18], rfOrder=21, authorNames=HAARNOJA T, ZHOU A, ABBEEL P, journalName=International Conference on Machine Learning. PMLR, refType=null, unstructuredReference=
HAARNOJA T,
ZHOU A,
ABBEEL P, et al. Soft Actor-Critic: Off-Policy Maximum Entropy Deep Reinforcement Learning with a Stochastic Actor[C]//
International Conference on Machine Learning. PMLR,
2018: 1861-1870., articleTitle=Soft Actor-Critic: Off-Policy Maximum Entropy Deep Reinforcement Learning with a Stochastic Actor, refAbstract=null), Reference(id=1204452621911302293, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2010, volume=50, issue=5, pageStart=645, pageEnd=648, url=null, language=null, rfNumber=[19], rfOrder=22, authorNames=李升波, 王建强, 李克强, journalName=清华大学学报(自然科学版), refType=null, unstructuredReference=李升波, 王建强, 李克强, 等. MPC实用化问题处理及在车辆ACC中的应用[J].
清华大学学报(自然科学版),
2010,
50(5): 645-648., articleTitle=MPC实用化问题处理及在车辆ACC中的应用, refAbstract=null), Reference(id=1204452622003576996, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=2010, volume=50, issue=5, pageStart=645, pageEnd=648, url=null, language=null, rfNumber=[19], rfOrder=23, authorNames=LI S B, WANG J Q, LI K Q, journalName=Journal of Tsinghua University (Science and Technology), refType=null, unstructuredReference=
LI S B,
WANG J Q,
LI K Q, et al. Processing of MPC Practical Problems and Its Application to Vehicular Adaptive Cruise Control Systems[J].
Journal of Tsinghua University (Science and Technology),
2010,
50(5): 645-648., articleTitle=Processing of MPC Practical Problems and Its Application to Vehicular Adaptive Cruise Control Systems, refAbstract=null), Reference(id=1204452622108434606, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, doi=null, pmid=null, pmcid=null, year=1999, volume=null, issue=null, pageStart=278, pageEnd=287, url=null, language=null, rfNumber=[20], rfOrder=24, authorNames=NG A Y, HARADA D, RUSSELL S, journalName=Proceedings of the Sixteenth International Conference on Machine Learning. ICML, refType=null, unstructuredReference=
NG A Y,
HARADA D,
RUSSELL S. Policy Invariance under Reward Transformations: Theory and Application to Reward Shaping[C]//
Proceedings of the Sixteenth International Conference on Machine Learning. ICML,
1999: 278-287., articleTitle=Policy Invariance under Reward Transformations: Theory and Application to Reward Shaping, refAbstract=null)], funds=[Fund(id=1204452618610385763, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, awardId=2019B090912001, language=CN, fundingSource=* 广东省重点领域研发项目(2019B090912001), fundOrder=null, country=null)], companyList=[AuthorCompany(id=1204452610192417745, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=1, ext=[AuthorCompanyExt(id=1204452610209194965, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 South China University of Technology, Guangzhou 510641), AuthorCompanyExt(id=1204452610217583574, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610192417745, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
1 华南理工大学,广州 510641)]), AuthorCompany(id=1204452610393744363, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, xref=2, ext=[AuthorCompanyExt(id=1204452610414715887, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610393744363, language=EN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 State Key Laboratory of Advanced Design and Manufacturing for Vehicle Body, Hunan University, Changsha 410082), AuthorCompanyExt(id=1204452610439881712, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, companyId=1204452610393744363, language=CN, country=null, province=null, city=null, postcode=null, companyName=null, departmentName=null, remark=
2 湖南大学,汽车车身先进设计制造国家重点实验室,长沙 410082)])], figs=[ArticleFig(id=1204452613824684431, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=xaagxvDBdncWcKy0UlveXg==, figureFileBig=N/6bB3s1uw1CDsHjdiXXWg==, tableContent=null), ArticleFig(id=1204452613933736347, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图1, caption=
车辆自适应巡航场景示意, figureFileSmall=xaagxvDBdncWcKy0UlveXg==, figureFileBig=N/6bB3s1uw1CDsHjdiXXWg==, tableContent=null), ArticleFig(id=1204452614105702836, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=4yTqAUKC5yZG3ZG5Z9JyQQ==, figureFileBig=onul+3CUGG3Qwj5MceOm8g==, tableContent=null), ArticleFig(id=1204452614290252226, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图2, caption=
自适应巡航控制DRL过程, figureFileSmall=4yTqAUKC5yZG3ZG5Z9JyQQ==, figureFileBig=onul+3CUGG3Qwj5MceOm8g==, tableContent=null), ArticleFig(id=1204452614399304139, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=28hbeC11sYrOcKubEcabMg==, figureFileBig=XVDRITiErMae49wL4fyWWQ==, tableContent=null), ArticleFig(id=1204452614529327581, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图3, caption=
动作值网络, figureFileSmall=28hbeC11sYrOcKubEcabMg==, figureFileBig=XVDRITiErMae49wL4fyWWQ==, tableContent=null), ArticleFig(id=1204452614629990891, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=JtlcBLZlSh20Kvw26fWOSQ==, figureFileBig=j7qYep1iACNWr0vxFLqC+A==, tableContent=null), ArticleFig(id=1204452614743237115, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图4, caption=
动作策略网络, figureFileSmall=JtlcBLZlSh20Kvw26fWOSQ==, figureFileBig=j7qYep1iACNWr0vxFLqC+A==, tableContent=null), ArticleFig(id=1204452614877454859, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=0oPe2oAfGX75fQ5nNmGnEg==, figureFileBig=8OFyST/nTDeya/PNu0pq7A==, tableContent=null), ArticleFig(id=1204452615041032732, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图5, caption=
基础奖励分布, figureFileSmall=0oPe2oAfGX75fQ5nNmGnEg==, figureFileBig=8OFyST/nTDeya/PNu0pq7A==, tableContent=null), ArticleFig(id=1204452615133307433, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=IdaYksc0ZF/0pdk+MZPrrA==, figureFileBig=PP+khPA/ajVjARu6Q5XUjQ==, tableContent=null), ArticleFig(id=1204452615322051130, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图6, caption=
细化奖励函数, figureFileSmall=IdaYksc0ZF/0pdk+MZPrrA==, figureFileBig=PP+khPA/ajVjARu6Q5XUjQ==, tableContent=null), ArticleFig(id=1204452615464657477, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=38aWVttl8mxJD8R+BsXIzg==, figureFileBig=38zfaCsnLLdbw9vxf+ZYEQ==, tableContent=null), ArticleFig(id=1204452615565320785, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图7, caption=
目标车行驶工况, figureFileSmall=38aWVttl8mxJD8R+BsXIzg==, figureFileBig=38zfaCsnLLdbw9vxf+ZYEQ==, tableContent=null), ArticleFig(id=1204452615678567006, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=b8FPEnSuJqCR3z+cbF57Pw==, figureFileBig=e2ziE2URsyq+clJu+BpRjw==, tableContent=null), ArticleFig(id=1204452615808590441, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图8, caption=
DRL模型训练结果, figureFileSmall=b8FPEnSuJqCR3z+cbF57Pw==, figureFileBig=e2ziE2URsyq+clJu+BpRjw==, tableContent=null), ArticleFig(id=1204452615926030962, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=3ESdQlBF50YUHG/dNFreAw==, figureFileBig=hXfexjFwncChadNvFOAPFg==, tableContent=null), ArticleFig(id=1204452616102191748, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图9, caption=
目标车静止场景下主车的状态曲线, figureFileSmall=3ESdQlBF50YUHG/dNFreAw==, figureFileBig=hXfexjFwncChadNvFOAPFg==, tableContent=null), ArticleFig(id=1204452616219632278, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=55sM2meQ9CP/42lCE+DAQw==, figureFileBig=uLK5asrq1hmgl44rRURKtA==, tableContent=null), ArticleFig(id=1204452616320295587, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图10, caption=
目标车低速场景下主车的状态曲线, figureFileSmall=55sM2meQ9CP/42lCE+DAQw==, figureFileBig=uLK5asrq1hmgl44rRURKtA==, tableContent=null), ArticleFig(id=1204452616433541806, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=77LZHzfIE2Q8faXCj1NWCQ==, figureFileBig=KD2zq8xL1Ax6i8QCU0PHjA==, tableContent=null), ArticleFig(id=1204452616580342455, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图11, caption=
目标车减速场景下主车的状态曲线, figureFileSmall=77LZHzfIE2Q8faXCj1NWCQ==, figureFileBig=KD2zq8xL1Ax6i8QCU0PHjA==, tableContent=null), ArticleFig(id=1204452616718754501, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=lONwVK4oJyl+cV9cEpZoiw==, figureFileBig=7DL5VRIrDSCEOTAdAdeG2w==, tableContent=null), ArticleFig(id=1204452616899109590, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图12, caption=
试验路线, figureFileSmall=lONwVK4oJyl+cV9cEpZoiw==, figureFileBig=7DL5VRIrDSCEOTAdAdeG2w==, tableContent=null), ArticleFig(id=1204452617029133023, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=ig5S/3f9FgGlWiszcdkmyA==, figureFileBig=Tz7XEzpUZq1tm+STwtJq5w==, tableContent=null), ArticleFig(id=1204452617146573546, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图13, caption=
试验主车和场景示意, figureFileSmall=ig5S/3f9FgGlWiszcdkmyA==, figureFileBig=Tz7XEzpUZq1tm+STwtJq5w==, tableContent=null), ArticleFig(id=1204452617284985589, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=voSRHQDdQFkP3udSi6t9Nw==, figureFileBig=HCXmTrZuszZ9hjc0kpSenw==, tableContent=null), ArticleFig(id=1204452617410814715, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=图14, caption=
试验主车状态曲线, figureFileSmall=voSRHQDdQFkP3udSi6t9Nw==, figureFileBig=HCXmTrZuszZ9hjc0kpSenw==, tableContent=null), ArticleFig(id=1204452617561809673, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 超参数 | 数值 | 超参数 | 数值 |
| 折扣因子γ | 0.995 | 神经网络 学习率lr | 0.000 1 |
| 软更新系数τ | 0.02 | 初始温度系数α0 | 0.2 |
| 批量大小 | 32 | 奖励缩聚因子χ | 0.000 1 |
经验缓存池最大 容量Cmax | 100 000 | | |
), ArticleFig(id=1204452617708610333, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=表1, caption=
算法超参数
, figureFileSmall=null, figureFileBig=null, tableContent=
| 超参数 | 数值 | 超参数 | 数值 |
| 折扣因子γ | 0.995 | 神经网络 学习率lr | 0.000 1 |
| 软更新系数τ | 0.02 | 初始温度系数α0 | 0.2 |
| 批量大小 | 32 | 奖励缩聚因子χ | 0.000 1 |
经验缓存池最大 容量Cmax | 100 000 | | |
), ArticleFig(id=1204452617847022376, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 场景 | 主车初速度 /km·h-1 | 时间步 |
| SAC | DDPG |
| 目标车静止 | 30 | 464 | 573 |
| 60 | 421 | 542 |
| 目标车低速 | 80 | 388 | 447 |
| 120 | 362 | 436 |
| 目标车减速 | 120 | 401 | 499 |
), ArticleFig(id=1204452618006405943, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=表2, caption=
不同场景下速度误差收敛至稳定状态所用的时间步
, figureFileSmall=null, figureFileBig=null, tableContent=
| 场景 | 主车初速度 /km·h-1 | 时间步 |
| SAC | DDPG |
| 目标车静止 | 30 | 464 | 573 |
| 60 | 421 | 542 |
| 目标车低速 | 80 | 388 | 447 |
| 120 | 362 | 436 |
| 目标车减速 | 120 | 401 | 499 |
), ArticleFig(id=1204452618136429379, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=EN, label=null, caption=null, figureFileSmall=null, figureFileBig=null, tableContent=
| 场景 | 主车初速度/km·h-1 | 冲击度(绝对值)均值/m·s-3 | 冲击度(绝对值)最值/m·s-3 |
| SAC | DDPG | SAC | DDPG |
| 目标车静止 | 30 | 9.73 | 13.01 | 62.57 | 145.80 |
| 60 | 10.59 | 13.04 | 73.87 | 138.92 |
| 目标车低速 | 80 | 12.00 | 15.77 | 48.45 | 195.31 |
| 120 | 13.52 | 14.23 | 149.21 | 242.01 |
| 目标车减速 | 120 | 14.15 | 26.32 | 110.32 | 256.98 |
), ArticleFig(id=1204452618300007247, tenantId=1146029695717560320, journalId=1189621681917173762, articleId=1204385487667568928, language=CN, label=表3, caption=
不同场景下主车冲击度(绝对值)均值和最值
, figureFileSmall=null, figureFileBig=null, tableContent=
| 场景 | 主车初速度/km·h-1 | 冲击度(绝对值)均值/m·s-3 | 冲击度(绝对值)最值/m·s-3 |
| SAC | DDPG | SAC | DDPG |
| 目标车静止 | 30 | 9.73 | 13.01 | 62.57 | 145.80 |
| 60 | 10.59 | 13.04 | 73.87 | 138.92 |
| 目标车低速 | 80 | 12.00 | 15.77 | 48.45 | 195.31 |
| 120 | 13.52 | 14.23 | 149.21 | 242.01 |
| 目标车减速 | 120 | 14.15 | 26.32 | 110.32 | 256.98 |
)], attaches=null, journal=Journal(id=1149693407745847311, delFlag=0, nameCn=汽车技术, nameEn=Automobile Technology, nameHistory1=null, nameHistory2=null, issn=1000-3703, eissn=null, cn=22-1113/U, coden=null, periodic=0, language=CN, oaType=null, ccby=null, superviseOffice=null, ownerOffice=null, pubOffice=null, editorOffice=null, officeType=null, aims=null, clcCode=null, officeProv=null, officeCity=null, officeAddr=null, officeZip=null, officeEmail=null, officePhone=null, editDirector=null, officeDirector=null, officeDirectorPhone=null, officeStaffNum=null, officeEmpNum=null, coverPicUrl=rYFtDx/CU9+iX8QTM0ckbw==, journalPrice=null, startedYear=null, abbrevIsoEn=null, journalRemark=null, publicationField=null, createdTime=1752037868679, updatedTime=1761735668047, createdBy=18614031015, updatedBy=13701087609, firstLetterCn=A, firstLetterEn=A, subjectCode=Engineering, subjectName=Engineering, subjectCodeEn=Engineering, subjectNameEn=null, picCn=rYFtDx/CU9+iX8QTM0ckbw==, picEn=oFT2NmUwKPUjZ27C1+d9pw==, jcr=null, cjcr=null, exts=[JournalExt(id=1190368926564450443, language=CN, name=汽车技术, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1761735668078, updatedTime=1761735668078, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=1, submissionEditorUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=3, submissionReviewUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""}), JournalExt(id=1190368926618976396, language=EN, name=Automobile Technology, nameHistory1=null, nameHistory2=null, managedBy=, sponsoredBy=, publishedBy=, editorOffice=, officeProv=null, officeCity=null, officeAddr=, officeZip=, editDirector=, officeDirector=null, officePhone=null, coverPicUrl=null, journalRemark=, submitArticleUrl=null, websiteUrl=, createdTime=1761735668091, updatedTime=1761735668091, createdBy=13701087609, updatedBy=13701087609, submissionGuidelinesUrl=, submissionAuthorUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=1, submissionEditorUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=3, submissionReviewUrl=https://qcjs.cbpt.cnki.net/index.aspx?t=2, submissionCeEditorUrl=, submissionAeEditorUrl=, option={"copyright":""})], databaseList=null, tenantJournalId=1189621681917173762, websiteList=[Website(id=1189624193747526544, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1189621681917173762, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/qcjs/CN, language=CN, createTime=1761558109939, createBy=18614031015, updateTime=1761558140534, updateBy=18614031015, name=汽车技术-中, tplId=1146099689490845704, title=汽车技术, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1189625424704451180, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=articleTextType, value=kx, createTime=1761558403421, updateTime=1761558403421, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424675091049, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=banner, value=null, createTime=1761558403414, updateTime=1761558403414, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424733811311, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=grayFlag, value=0, createTime=1761558403428, updateTime=1761558403428, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424658313832, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=logo, value=https://castjournals.cast.org.cn/joweb/qcjs/CN/file/pic?fileId=7En9rzX2QCa/1J8NnKt/Fg==, createTime=1761558403410, updateTime=1761558403410, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424746394225, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=minRunFlag, value=0, createTime=1761558403431, updateTime=1761558403431, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424691868267, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/qcjs/CN/file/pic, createTime=1761558403418, updateTime=1761558403418, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424742199920, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=silenceFlag, value=0, createTime=1761558403430, updateTime=1761558403430, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424683479658, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_cn_619/, createTime=1761558403416, updateTime=1761558403416, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424712839789, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=themeColor, value=null, createTime=1761558403423, updateTime=1761558403423, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625424725422702, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193747526544, code=themeStyle, value=null, createTime=1761558403426, updateTime=1761558403426, creator=18614031015, updator=18614031015)]), Website(id=1189624193869161363, webName=null, webTitle=null, webDomain=null, webCopyrigh=null, webIpcNo=null, seoTitle=null, seoKeywords=null, seoDescription=null, tenantJournalId=null, journalId=1189621681917173762, journalNameCn=null, journalNameEn=null, grayFlag=null, tenantId=1146029695717560320, platformId=null, journalGroupId=null, journalGroupNameCn=null, journalGroupNameEn=null, type=1, domain=https://castjournals.cast.org.cn/joweb/qcjs/EN, language=EN, createTime=1761558109967, createBy=18614031015, updateTime=1761558340679, updateBy=18614031015, name=汽车技术-英文, tplId=1146101810881728533, title=Automobile Technology, delFlag=0, indexPage=/home, props=[WebsiteProps(id=1189625550722311064, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=articleTextType, value=kx, createTime=1761558433466, updateTime=1761558433466, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550688756629, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=banner, value=null, createTime=1761558433458, updateTime=1761558433458, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550739088283, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=grayFlag, value=0, createTime=1761558433470, updateTime=1761558433470, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550676173716, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=logo, value=https://castjournals.cast.org.cn/joweb/qcjs/EN/file/pic?fileId=7En9rzX2QCa/1J8NnKt/Fg==, createTime=1761558433455, updateTime=1761558433455, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550751671197, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=minRunFlag, value=0, createTime=1761558433473, updateTime=1761558433473, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550713922455, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=picServerUrl, value=https://castjournals.cast.org.cn/joweb/qcjs/EN/file/pic, createTime=1761558433464, updateTime=1761558433464, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550743282588, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=silenceFlag, value=0, createTime=1761558433471, updateTime=1761558433471, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550705533846, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=staticResourcePath, value=https://castjournals.cast.org.cn/joweb/cast_kjdb_en_623/, createTime=1761558433462, updateTime=1761558433462, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550726505369, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=themeColor, value=null, createTime=1761558433467, updateTime=1761558433467, creator=18614031015, updator=18614031015), WebsiteProps(id=1189625550734893978, tenantId=1146029695717560320, journalId=null, journalGroupId=null, siteId=1189624193869161363, code=themeStyle, value=null, createTime=1761558433469, updateTime=1761558433469, creator=18614031015, updator=18614031015)])], journalTitle=汽车技术, weixinUrl=null, journalUrl=null, iacademicId=null, status=1, seqNo=null, journalTitleEn=Automobile Technology, journalPhotoCn=rYFtDx/CU9+iX8QTM0ckbw==, journalPhotoEn=oFT2NmUwKPUjZ27C1+d9pw==, journalFirstLetter=A, journalRecommend=null, journalNew=null, journalCollection=null, jcrJf=null, cjcrJf=null, jcrJfStr=null, cjcrJfStr=null, submissionFirstDecision=null, sciSubjectClassification=null, casSubjectClassification=null, citeScore=null, totalCitationFrequency=null, icpCode=null, psCode=null, advertisingLicenseCode=null, copyrightInformation=null, country=null, option=, provinceCode=null, provinceName=null, collectFlag=false), detailUrlCn=https://castjournals.cast.org.cn/joweb/qcjs/CN/10.19620/j.cnki.1000-3703.20220500, detailUrlEn=https://castjournals.cast.org.cn/joweb/qcjs/EN/10.19620/j.cnki.1000-3703.20220500, pdfUrlCn=https://castjournals.cast.org.cn/joweb/qcjs/CN/PDF/10.19620/j.cnki.1000-3703.20220500, pdfUrlEn=https://castjournals.cast.org.cn/joweb/qcjs/EN/PDF/10.19620/j.cnki.1000-3703.20220500, aliStartDate=null, aliEndDate=null, collectionFlag=false, citedCount=null, citedUrl=null, reference=null)