<?xml version="1.0" encoding="utf-8" standalone="no"?>
<dublin_core schema="dc">
<dcvalue element="contributor" qualifier="author">Choi,&#x20;Hyeong&#x20;Kyu</dcvalue>
<dcvalue element="contributor" qualifier="author">Paik,&#x20;Chong&#x20;Keun</dcvalue>
<dcvalue element="contributor" qualifier="author">Ko,&#x20;Hyun&#x20;Woo</dcvalue>
<dcvalue element="contributor" qualifier="author">Park,&#x20;Min-Chul</dcvalue>
<dcvalue element="contributor" qualifier="author">Kim,&#x20;Hyunwoo&#x20;J.</dcvalue>
<dcvalue element="date" qualifier="accessioned">2024-01-19T09:03:52Z</dcvalue>
<dcvalue element="date" qualifier="available">2024-01-19T09:03:52Z</dcvalue>
<dcvalue element="date" qualifier="created">2023-08-24</dcvalue>
<dcvalue element="date" qualifier="issued">2023-07</dcvalue>
<dcvalue element="identifier" qualifier="issn">2169-3536</dcvalue>
<dcvalue element="identifier" qualifier="uri">https:&#x2F;&#x2F;pubs.kist.re.kr&#x2F;handle&#x2F;201004&#x2F;113491</dcvalue>
<dcvalue element="description" qualifier="abstract">Recent&#x20;Transformer-based&#x20;object&#x20;detectors&#x20;have&#x20;achieved&#x20;remarkable&#x20;performance&#x20;on&#x20;benchmark&#x20;datasets,&#x20;but&#x20;few&#x20;have&#x20;addressed&#x20;the&#x20;real-world&#x20;challenge&#x20;of&#x20;object&#x20;detection&#x20;in&#x20;crowded&#x20;scenes&#x20;using&#x20;transformers.&#x20;This&#x20;limitation&#x20;stems&#x20;from&#x20;the&#x20;fixed&#x20;query&#x20;set&#x20;size&#x20;of&#x20;the&#x20;transformer&#x20;decoder,&#x20;which&#x20;restricts&#x20;the&#x20;model&amp;apos;s&#x20;inference&#x20;capacity.&#x20;To&#x20;overcome&#x20;this&#x20;challenge,&#x20;we&#x20;propose&#x20;Recurrent&#x20;Detection&#x20;Transformer&#x20;(Recurrent&#x20;DETR),&#x20;an&#x20;object&#x20;detector&#x20;that&#x20;iterates&#x20;the&#x20;decoder&#x20;block&#x20;to&#x20;render&#x20;more&#x20;predictions&#x20;with&#x20;a&#x20;finite&#x20;number&#x20;of&#x20;query&#x20;tokens.&#x20;Recurrent&#x20;DETR&#x20;can&#x20;adaptively&#x20;control&#x20;the&#x20;number&#x20;of&#x20;decoder&#x20;block&#x20;iterations&#x20;based&#x20;on&#x20;the&#x20;image&amp;apos;s&#x20;crowdedness&#x20;or&#x20;complexity,&#x20;resulting&#x20;in&#x20;a&#x20;variable-size&#x20;prediction&#x20;set.&#x20;This&#x20;is&#x20;enabled&#x20;by&#x20;our&#x20;novel&#x20;Pondering&#x20;Hungarian&#x20;Loss,&#x20;which&#x20;helps&#x20;the&#x20;model&#x20;to&#x20;learn&#x20;when&#x20;additional&#x20;computation&#x20;is&#x20;required&#x20;to&#x20;identify&#x20;all&#x20;the&#x20;objects&#x20;in&#x20;a&#x20;crowded&#x20;scene.&#x20;We&#x20;demonstrate&#x20;the&#x20;effectiveness&#x20;of&#x20;Recurrent&#x20;DETR&#x20;on&#x20;two&#x20;datasets:&#x20;COCO&#x20;2017,&#x20;which&#x20;represents&#x20;a&#x20;standard&#x20;setting,&#x20;and&#x20;CrowdHuman,&#x20;which&#x20;features&#x20;a&#x20;crowded&#x20;setting.&#x20;Our&#x20;experiments&#x20;on&#x20;both&#x20;datasets&#x20;show&#x20;that&#x20;Recurrent&#x20;DETR&#x20;achieves&#x20;significant&#x20;performance&#x20;gains&#x20;of&#x20;0.8&#x20;AP&#x20;and&#x20;0.4&#x20;AP,&#x20;respectively,&#x20;over&#x20;its&#x20;base&#x20;architectures.&#x20;Moreover,&#x20;we&#x20;conduct&#x20;comprehensive&#x20;analyses&#x20;under&#x20;different&#x20;query&#x20;set&#x20;size&#x20;constraints&#x20;to&#x20;provide&#x20;a&#x20;thorough&#x20;evaluation&#x20;of&#x20;our&#x20;proposed&#x20;method.</dcvalue>
<dcvalue element="language" qualifier="none">English</dcvalue>
<dcvalue element="publisher" qualifier="none">IEEE-INST&#x20;ELECTRICAL&#x20;ELECTRONICS&#x20;ENGINEERS&#x20;INC</dcvalue>
<dcvalue element="title" qualifier="none">Recurrent&#x20;DETR:&#x20;Transformer-Based&#x20;Object&#x20;Detection&#x20;for&#x20;Crowded&#x20;Scenes</dcvalue>
<dcvalue element="type" qualifier="none">Article</dcvalue>
<dcvalue element="identifier" qualifier="doi">10.1109&#x2F;ACCESS.2023.3293532</dcvalue>
<dcvalue element="description" qualifier="journalClass">1</dcvalue>
<dcvalue element="identifier" qualifier="bibliographicCitation">IEEE&#x20;ACCESS,&#x20;v.11,&#x20;pp.78623&#x20;-&#x20;78643</dcvalue>
<dcvalue element="citation" qualifier="title">IEEE&#x20;ACCESS</dcvalue>
<dcvalue element="citation" qualifier="volume">11</dcvalue>
<dcvalue element="citation" qualifier="startPage">78623</dcvalue>
<dcvalue element="citation" qualifier="endPage">78643</dcvalue>
<dcvalue element="description" qualifier="isOpenAccess">Y</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scie</dcvalue>
<dcvalue element="description" qualifier="journalRegisteredClass">scopus</dcvalue>
<dcvalue element="identifier" qualifier="wosid">001042016700001</dcvalue>
<dcvalue element="identifier" qualifier="scopusid">2-s2.0-85164707936</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Computer&#x20;Science,&#x20;Information&#x20;Systems</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Engineering,&#x20;Electrical&#x20;&amp;&#x20;Electronic</dcvalue>
<dcvalue element="relation" qualifier="journalWebOfScienceCategory">Telecommunications</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Computer&#x20;Science</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Engineering</dcvalue>
<dcvalue element="relation" qualifier="journalResearchArea">Telecommunications</dcvalue>
<dcvalue element="type" qualifier="docType">Article</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">Computer&#x20;vision</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">object&#x20;detection</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">detection&#x20;transformers</dcvalue>
<dcvalue element="subject" qualifier="keywordAuthor">dynamic&#x20;computation</dcvalue>
</dublin_core>
