<?xml version="1.0" encoding="utf-8" standalone="no"?>
<dublin_core schema="dc">
<dcvalue element="contributor" qualifier="author">Kim,&#x20;Yu-Jin</dcvalue>
<dcvalue element="contributor" qualifier="author">Ahn,&#x20;Woo-Jin</dcvalue>
<dcvalue element="contributor" qualifier="author">Jang,&#x20;Sun-Ho</dcvalue>
<dcvalue element="contributor" qualifier="author">Lim,&#x20;Myo-Taeg</dcvalue>
<dcvalue element="contributor" qualifier="author">Pae,&#x20;Dong-Sung</dcvalue>
<dcvalue element="date" qualifier="accessioned">2024-07-11T06:01:23Z</dcvalue>
<dcvalue element="date" qualifier="available">2024-07-11T06:01:23Z</dcvalue>
<dcvalue element="date" qualifier="created">2024-07-11</dcvalue>
<dcvalue element="date" qualifier="issued">2024-06</dcvalue>
<dcvalue element="identifier" qualifier="uri">https:&#x2F;&#x2F;pubs.kist.re.kr&#x2F;handle&#x2F;201004&#x2F;150216</dcvalue>
<dcvalue element="description" qualifier="abstract">Goal-conditioned&#x20;Reinforcement&#x20;Learning&#x20;(RL)&#x20;holds&#x20;promise&#x20;for&#x20;addressing&#x20;intricate&#x20;control&#x20;challenges&#x20;by&#x20;enabling&#x20;agents&#x20;to&#x20;learn&#x20;and&#x20;execute&#x20;desired&#x20;skills&#x20;through&#x20;separate&#x20;decision&#x20;modules.&#x20;However,&#x20;the&#x20;irregular&#x20;occurrence&#x20;of&#x20;required&#x20;skills&#x20;poses&#x20;a&#x20;significant&#x20;challenge&#x20;to&#x20;effective&#x20;learning.&#x20;In&#x20;this&#x20;paper,&#x20;we&#x20;demonstrate&#x20;the&#x20;detrimental&#x20;effects&#x20;of&#x20;this&#x20;imbalanced&#x20;skill&#x20;(sub-goal)&#x20;distribution&#x20;and&#x20;propose&#x20;a&#x20;novel&#x20;training&#x20;approach,&#x20;Classified&#x20;Experience&#x20;Replay&#x20;(CER),&#x20;designed&#x20;to&#x20;mitigate&#x20;this&#x20;challenge.&#x20;We&#x20;demonstrate&#x20;that&#x20;adapting&#x20;our&#x20;method&#x20;to&#x20;conventional&#x20;RL&#x20;methods&#x20;significantly&#x20;enhances&#x20;the&#x20;performance&#x20;of&#x20;the&#x20;RL&#x20;agent.&#x20;Considering&#x20;the&#x20;challenges&#x20;inherent&#x20;in&#x20;tasks&#x20;such&#x20;as&#x20;driving,&#x20;characterized&#x20;by&#x20;biased&#x20;occurrences&#x20;of&#x20;required&#x20;sub-goals,&#x20;our&#x20;study&#x20;demonstrates&#x20;the&#x20;improvement&#x20;in&#x20;trained&#x20;outcomes&#x20;facilitated&#x20;by&#x20;the&#x20;proposed&#x20;method.&#x20;In&#x20;addition,&#x20;we&#x20;introduce&#x20;a&#x20;specialized&#x20;framework&#x20;tailored&#x20;for&#x20;self-driving&#x20;tasks&#x20;on&#x20;highways,&#x20;integrating&#x20;model&#x20;predictive&#x20;control&#x20;into&#x20;our&#x20;RL&#x20;trajectory&#x20;optimization&#x20;training&#x20;paradigm.&#x20;Our&#x20;approach,&#x20;utilizing&#x20;CER&#x20;with&#x20;the&#x20;suggested&#x20;framework,&#x20;yields&#x20;remarkable&#x20;advancements&#x20;in&#x20;trajectory&#x20;optimization&#x20;for&#x20;RL&#x20;agents&#x20;operating&#x20;in&#x20;highway&#x20;environments.</dcvalue>
<dcvalue element="language" qualifier="none">English</dcvalue>
<dcvalue element="publisher" qualifier="none">MDPI</dcvalue>
<dcvalue element="title" qualifier="none">A&#x20;Reinforcement&#x20;Learning&#x20;Approach&#x20;to&#x20;Dynamic&#x20;Trajectory&#x20;Optimization&#x20;with&#x20;Consideration&#x20;of&#x20;Imbalanced&#x20;Sub-Goals&#x20;in&#x20;Self-Driving&#x20;Vehicles</dcvalue>
<dcvalue element="type" qualifier="none">Article</dcvalue>
<dcvalue element="identifier" qualifier="doi">10.3390&#x2F;app14125213</dcvalue>
<dcvalue element="description" qualifier="journalClass">1</dcvalue>
<dcvalue element="identifier" qualifier="bibliographicCitation">Applied&#x20;Sciences-basel,&#x20;v.14,&#x20;no.12</dcvalue>
<dcvalue element="citation" qualifier="title">Applied&#x20;Sciences-basel</dcvalue>
<dcvalue element="citation" qualifier="volume">14</dcvalue>
<dcvalue element="citation" qualifier="number">12</dcvalue>
<dcvalue element="description" qualifier="isOpenAccess">Y</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scie</dcvalue>
<dcvalue element="identifier" qualifier="wosid">001254443800001</dcvalue>
<dcvalue element="identifier" qualifier="scopusid">2-s2.0-85197244022</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Chemistry,&#x20;Multidisciplinary</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Engineering,&#x20;Multidisciplinary</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Materials&#x20;Science,&#x20;Multidisciplinary</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Physics,&#x20;Applied</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Chemistry</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Engineering</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Materials&#x20;Science</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Physics</dcvalue>
<dcvalue element="type" qualifier="docType">Article</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">reinforcement&#x20;learning</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">experience&#x20;replay</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">self-driving</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">trajectory&#x20;optimization</dcvalue>
</dublin_core>
