<?xml version="1.0" encoding="utf-8" standalone="no"?>
<dublin_core schema="dc">
<dcvalue element="contributor" qualifier="author">Yi,&#x20;Gyeong&#x20;Hoon</dcvalue>
<dcvalue element="contributor" qualifier="author">Choi,&#x20;Jiwoo</dcvalue>
<dcvalue element="contributor" qualifier="author">Song,&#x20;Hyeongyun</dcvalue>
<dcvalue element="contributor" qualifier="author">Miano,&#x20;Olivia</dcvalue>
<dcvalue element="contributor" qualifier="author">Choi,&#x20;Jaewoong</dcvalue>
<dcvalue element="contributor" qualifier="author">Bang,&#x20;Kihoon</dcvalue>
<dcvalue element="contributor" qualifier="author">Lee,&#x20;Byungju</dcvalue>
<dcvalue element="contributor" qualifier="author">Sohn,&#x20;Seok&#x20;Su</dcvalue>
<dcvalue element="contributor" qualifier="author">Buttler,&#x20;David</dcvalue>
<dcvalue element="contributor" qualifier="author">Hiszpanski,&#x20;Anna</dcvalue>
<dcvalue element="contributor" qualifier="author">Han,&#x20;Sang&#x20;Soo</dcvalue>
<dcvalue element="contributor" qualifier="author">Kim,&#x20;Donghun</dcvalue>
<dcvalue element="date" qualifier="accessioned">2025-03-19T15:31:18Z</dcvalue>
<dcvalue element="date" qualifier="available">2025-03-19T15:31:18Z</dcvalue>
<dcvalue element="date" qualifier="created">2025-03-19</dcvalue>
<dcvalue element="date" qualifier="issued">2025-04</dcvalue>
<dcvalue element="identifier" qualifier="uri">https:&#x2F;&#x2F;pubs.kist.re.kr&#x2F;handle&#x2F;201004&#x2F;151918</dcvalue>
<dcvalue element="description" qualifier="abstract">Efficiently&#x20;extracting&#x20;data&#x20;from&#x20;tables&#x20;in&#x20;the&#x20;scientific&#x20;literature&#x20;is&#x20;pivotal&#x20;for&#x20;building&#x20;large-scale&#x20;databases.&#x20;However,&#x20;the&#x20;tables&#x20;reported&#x20;in&#x20;materials&#x20;science&#x20;papers&#x20;exist&#x20;in&#x20;highly&#x20;diverse&#x20;forms;&#x20;thus,&#x20;rule-based&#x20;extractions&#x20;are&#x20;an&#x20;ineffective&#x20;approach.&#x20;To&#x20;overcome&#x20;this&#x20;challenge,&#x20;the&#x20;study&#x20;presents&#x20;MaTableGPT,&#x20;which&#x20;is&#x20;a&#x20;GPT-based&#x20;table&#x20;data&#x20;extractor&#x20;from&#x20;the&#x20;materials&#x20;science&#x20;literature.&#x20;MaTableGPT&#x20;features&#x20;key&#x20;strategies&#x20;of&#x20;table&#x20;data&#x20;representation&#x20;and&#x20;table&#x20;splitting&#x20;for&#x20;better&#x20;GPT&#x20;comprehension&#x20;and&#x20;filtering&#x20;hallucinated&#x20;information&#x20;through&#x20;follow-up&#x20;questions.&#x20;When&#x20;applied&#x20;to&#x20;a&#x20;vast&#x20;volume&#x20;of&#x20;water&#x20;splitting&#x20;catalysis&#x20;literature,&#x20;MaTableGPT&#x20;achieves&#x20;an&#x20;extraction&#x20;accuracy&#x20;(total&#x20;F1&#x20;score)&#x20;of&#x20;up&#x20;to&#x20;96.8%.&#x20;Through&#x20;comprehensive&#x20;evaluations&#x20;of&#x20;the&#x20;GPT&#x20;usage&#x20;cost,&#x20;labeling&#x20;cost,&#x20;and&#x20;extraction&#x20;accuracy&#x20;for&#x20;the&#x20;learning&#x20;methods&#x20;of&#x20;zero-shot,&#x20;few-shot,&#x20;and&#x20;fine-tuning,&#x20;the&#x20;study&#x20;presents&#x20;a&#x20;Pareto-front&#x20;mapping&#x20;where&#x20;the&#x20;few-shot&#x20;learning&#x20;method&#x20;is&#x20;found&#x20;to&#x20;be&#x20;the&#x20;most&#x20;balanced&#x20;solution&#x20;owing&#x20;to&#x20;both&#x20;its&#x20;high&#x20;extraction&#x20;accuracy&#x20;(total&#x20;F1&#x20;score&#x20;&gt;95%)&#x20;and&#x20;low&#x20;cost&#x20;(GPT&#x20;usage&#x20;cost&#x20;of&#x20;5.97&#x20;US&#x20;dollars&#x20;and&#x20;labeling&#x20;cost&#x20;of&#x20;10&#x20;I&#x2F;O&#x20;paired&#x20;examples).&#x20;The&#x20;statistical&#x20;analyses&#x20;conducted&#x20;on&#x20;the&#x20;database&#x20;generated&#x20;by&#x20;MaTableGPT&#x20;revealed&#x20;valuable&#x20;insights&#x20;into&#x20;the&#x20;distribution&#x20;of&#x20;the&#x20;overpotential&#x20;and&#x20;elemental&#x20;utilization&#x20;across&#x20;the&#x20;reported&#x20;catalysts&#x20;in&#x20;the&#x20;water&#x20;splitting&#x20;literature.</dcvalue>
<dcvalue element="language" qualifier="none">English</dcvalue>
<dcvalue element="publisher" qualifier="none">Wiley-VCH&#x20;Verlag</dcvalue>
<dcvalue element="title" qualifier="none">MaTableGPT:&#x20;GPT-Based&#x20;Table&#x20;Data&#x20;Extractor&#x20;from&#x20;Materials&#x20;Science&#x20;Literature</dcvalue>
<dcvalue element="type" qualifier="none">Article</dcvalue>
<dcvalue element="identifier" qualifier="doi">10.1002&#x2F;advs.202408221</dcvalue>
<dcvalue element="description" qualifier="journalClass">1</dcvalue>
<dcvalue element="identifier" qualifier="bibliographicCitation">Advanced&#x20;Science,&#x20;v.12,&#x20;no.16</dcvalue>
<dcvalue element="citation" qualifier="title">Advanced&#x20;Science</dcvalue>
<dcvalue element="citation" qualifier="volume">12</dcvalue>
<dcvalue element="citation" qualifier="number">16</dcvalue>
<dcvalue element="description" qualifier="isOpenAccess">Y</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scie</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scopus</dcvalue>
<dcvalue element="identifier" qualifier="wosid">001405309300001</dcvalue>
<dcvalue element="identifier" qualifier="scopusid">2-s2.0-85215658421</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Chemistry,&#x20;Multidisciplinary</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Nanoscience&#x20;&amp;&#x20;Nanotechnology</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Materials&#x20;Science,&#x20;Multidisciplinary</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Chemistry</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Science&#x20;&amp;&#x20;Technology&#x20;-&#x20;Other&#x20;Topics</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Materials&#x20;Science</dcvalue>
<dcvalue element="type" qualifier="docType">Article</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">OXYGEN&#x20;EVOLUTION</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">REDUCTION</dcvalue>
<dcvalue element="subject" qualifier="keywordPlus">CATALYST</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">GPT</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">large&#x20;language&#x20;models</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">literature&#x20;mining</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">machine&#x20;learning</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">materials&#x20;science</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">table&#x20;data&#x20;extraction</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">water&#x20;splitting&#x20;catalysis</dcvalue>
</dublin_core>
