<?xml version="1.0" encoding="utf-8" standalone="no"?>
<dublin_core schema="dc">
<dcvalue element="contributor" qualifier="author">Lawler,&#x20;Robin</dcvalue>
<dcvalue element="contributor" qualifier="author">Liu,&#x20;Yao-Hao</dcvalue>
<dcvalue element="contributor" qualifier="author">Majaya,&#x20;Nessa</dcvalue>
<dcvalue element="contributor" qualifier="author">Allam,&#x20;Omar</dcvalue>
<dcvalue element="contributor" qualifier="author">Ju,&#x20;Hyunchul</dcvalue>
<dcvalue element="contributor" qualifier="author">Kim,&#x20;Jin&#x20;Young</dcvalue>
<dcvalue element="contributor" qualifier="author">Jang,&#x20;Seung&#x20;Soon</dcvalue>
<dcvalue element="date" qualifier="accessioned">2024-01-19T13:32:51Z</dcvalue>
<dcvalue element="date" qualifier="available">2024-01-19T13:32:51Z</dcvalue>
<dcvalue element="date" qualifier="created">2022-01-10</dcvalue>
<dcvalue element="date" qualifier="issued">2021-10-07</dcvalue>
<dcvalue element="identifier" qualifier="issn">1089-5639</dcvalue>
<dcvalue element="identifier" qualifier="uri">https:&#x2F;&#x2F;pubs.kist.re.kr&#x2F;handle&#x2F;201004&#x2F;116268</dcvalue>
<dcvalue element="description" qualifier="abstract">In&#x20;this&#x20;study,&#x20;we&#x20;propose&#x20;a&#x20;novel&#x20;method&#x20;of&#x20;pK(a)&#x20;prediction&#x20;in&#x20;a&#x20;diverse&#x20;set&#x20;of&#x20;acids,&#x20;which&#x20;combines&#x20;density&#x20;functional&#x20;theory&#x20;(DFT)&#x20;method&#x20;with&#x20;machine&#x20;learning&#x20;(ML)&#x20;methods.&#x20;First,&#x20;the&#x20;DFT&#x20;method&#x20;with&#x20;B3LYP&#x2F;6-31++G**&#x2F;SM8&#x20;is&#x20;used&#x20;to&#x20;predict&#x20;pK(a),&#x20;yielding&#x20;a&#x20;mean&#x20;absolute&#x20;error&#x20;of&#x20;1.85&#x20;pK(a)&#x20;units.&#x20;Subsequently,&#x20;such&#x20;pK(a)&#x20;values&#x20;predicted&#x20;from&#x20;the&#x20;DFT&#x20;method&#x20;are&#x20;employed&#x20;as&#x20;one&#x20;of&#x20;10&#x20;molecular&#x20;descriptors&#x20;for&#x20;developing&#x20;ML&#x20;models&#x20;trained&#x20;on&#x20;experimental&#x20;data.&#x20;Kernel&#x20;Ridge&#x20;Regression&#x20;(KRR),&#x20;Gaussian&#x20;Process&#x20;Regression,&#x20;and&#x20;Artificial&#x20;Neural&#x20;Network&#x20;are&#x20;optimized&#x20;using&#x20;three&#x20;Pipelines:&#x20;Pipeline&#x20;1&#x20;involving&#x20;only&#x20;hyperparameter&#x20;optimization&#x20;(HPO),&#x20;Pipeline&#x20;2&#x20;involving&#x20;HPO&#x20;followed&#x20;by&#x20;a&#x20;relative&#x20;contribution&#x20;analysis&#x20;(RCA)&#x20;and&#x20;recursive&#x20;feature&#x20;elimination&#x20;(RFE),&#x20;and&#x20;Pipeline&#x20;3&#x20;involving&#x20;HPO&#x20;followed&#x20;by&#x20;RCA&#x20;and&#x20;RFE&#x20;on&#x20;an&#x20;expanded&#x20;set&#x20;of&#x20;composite&#x20;features.&#x20;Finally,&#x20;it&#x20;is&#x20;demonstrated&#x20;that&#x20;KRR&#x20;with&#x20;Pipeline&#x20;3&#x20;yields&#x20;optimal&#x20;pK(a)&#x20;prediction&#x20;at&#x20;an&#x20;MAE&#x20;of&#x20;0.60&#x20;log&#x20;units.&#x20;This&#x20;algorithm&#x20;was&#x20;then&#x20;utilized&#x20;to&#x20;predict&#x20;the&#x20;pKa&#x20;of&#x20;37&#x20;novel&#x20;acids.&#x20;The&#x20;two&#x20;most&#x20;important&#x20;features&#x20;were&#x20;determined&#x20;to&#x20;be&#x20;the&#x20;number&#x20;of&#x20;hydrogen&#x20;atoms&#x20;in&#x20;the&#x20;molecule&#x20;and&#x20;the&#x20;degree&#x20;of&#x20;oxidation&#x20;of&#x20;the&#x20;acid.&#x20;The&#x20;predicted&#x20;pKa&#x20;values&#x20;were&#x20;documented&#x20;for&#x20;future&#x20;reference.</dcvalue>
<dcvalue element="language" qualifier="none">English</dcvalue>
<dcvalue element="publisher" qualifier="none">AMER&#x20;CHEMICAL&#x20;SOC</dcvalue>
<dcvalue element="subject" qualifier="none">ACID&#x20;DISSOCIATION-CONSTANTS</dcvalue>
<dcvalue element="subject" qualifier="none">DENSITY-FUNCTIONAL&#x20;METHODS</dcvalue>
<dcvalue element="subject" qualifier="none">SOLVATION&#x20;FREE-ENERGIES</dcvalue>
<dcvalue element="subject" qualifier="none">COMPLETE&#x20;BASIS-SET</dcvalue>
<dcvalue element="subject" qualifier="none">PHOSPHONIC&#x20;ACID</dcvalue>
<dcvalue element="subject" qualifier="none">PROTON&#x20;CONDUCTIVITY</dcvalue>
<dcvalue element="subject" qualifier="none">PROTOGENIC&#x20;GROUP</dcvalue>
<dcvalue element="subject" qualifier="none">NEURAL-NETWORKS</dcvalue>
<dcvalue element="subject" qualifier="none">SULFONIC-ACID</dcvalue>
<dcvalue element="subject" qualifier="none">VALUES</dcvalue>
<dcvalue element="title" qualifier="none">DFT-Machine&#x20;Learning&#x20;Approach&#x20;for&#x20;Accurate&#x20;Prediction&#x20;of&#x20;pK(a)</dcvalue>
<dcvalue element="type" qualifier="none">Article</dcvalue>
<dcvalue element="identifier" qualifier="doi">10.1021&#x2F;acs.jpca.1c05031</dcvalue>
<dcvalue element="description" qualifier="journalClass">1</dcvalue>
<dcvalue element="identifier" qualifier="bibliographicCitation">JOURNAL&#x20;OF&#x20;PHYSICAL&#x20;CHEMISTRY&#x20;A,&#x20;v.125,&#x20;no.39,&#x20;pp.8712&#x20;-&#x20;8722</dcvalue>
<dcvalue element="citation" qualifier="title">JOURNAL&#x20;OF&#x20;PHYSICAL&#x20;CHEMISTRY&#x20;A</dcvalue>
<dcvalue element="citation" qualifier="volume">125</dcvalue>
<dcvalue element="citation" qualifier="number">39</dcvalue>
<dcvalue element="citation" qualifier="startPage">8712</dcvalue>
<dcvalue element="citation" qualifier="endPage">8722</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scie</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scopus</dcvalue>
<dcvalue element="identifier" qualifier="wosid">000707037900020</dcvalue>
<dcvalue element="identifier" qualifier="scopusid">2-s2.0-85116701045</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Chemistry,&#x20;Physical</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Physics,&#x20;Atomic,&#x20;Molecular&#x20;&amp;&#x20;Chemical</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Chemistry</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Physics</dcvalue>
<dcvalue element="type" qualifier="docType">Article</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">ACID&#x20;DISSOCIATION-CONSTANTS</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">DENSITY-FUNCTIONAL&#x20;METHODS</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">SOLVATION&#x20;FREE-ENERGIES</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">COMPLETE&#x20;BASIS-SET</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">PHOSPHONIC&#x20;ACID</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">PROTON&#x20;CONDUCTIVITY</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">PROTOGENIC&#x20;GROUP</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">NEURAL-NETWORKS</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">SULFONIC-ACID</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">VALUES</dcvalue>
</dublin_core>
