Computer Vision and Pattern Recognition

<!DOCTYPE html>
<html lang="en">
<head>
  <!-- Encoding declaration comes first so it is seen before any text content.
       NOTE(review): assumes the page is served as UTF-8; confirm against the response headers. -->
  <meta charset="utf-8">
  <title>Computer Vision and Pattern Recognition </title>
  <meta name="viewport" content="width=device-width, initial-scale=1">

  <!-- Favicons, web-app manifest and browser UI colours. -->
  <link rel="apple-touch-icon" sizes="180x180" href="/static/browse/0.3.4/images/icons/apple-touch-icon.png">
  <link rel="icon" type="image/png" sizes="32x32" href="/static/browse/0.3.4/images/icons/favicon-32x32.png">
  <link rel="icon" type="image/png" sizes="16x16" href="/static/browse/0.3.4/images/icons/favicon-16x16.png">
  <link rel="manifest" href="/static/browse/0.3.4/images/icons/site.webmanifest">
  <link rel="mask-icon" href="/static/browse/0.3.4/images/icons/safari-pinned-tab.svg" color="#5bbad5">
  <meta name="msapplication-TileColor" content="#da532c">
  <meta name="theme-color" content="#ffffff">

  <!-- Stylesheets: two for screen, one for print. -->
  <link rel="stylesheet" media="screen" href="/static/browse/0.3.4/css/arXiv.css?v=20241206">
  <link rel="stylesheet" media="print" href="/static/browse/0.3.4/css/arXiv-print.css?v=20200611">
  <link rel="stylesheet" media="screen" href="/static/browse/0.3.4/css/browse_search.css">

  <!-- Scripts are loaded synchronously (no defer or async): the inline call
       below runs immediately and presumably relies on mathjaxToggle.min.js
       having already defined mathjaxToggle(). -->
  <script src="/static/browse/0.3.4/js/accordion.js"></script>
  <script src="/static/browse/0.3.4/js/mathjaxToggle.min.js"></script>
  <script>mathjaxToggle();</script>
</head>
<body class="with-cu-identity">
  <div class="flex-wrap-footer">
    <header>
      <!-- Skip link: first link in the body, targets #content. -->
      <a href="#content" class="is-sr-only">Skip to main content</a>

      <!-- Cornell identity bar (carries the is-hidden-mobile class): logo plus support acknowledgement. -->
      <div class="columns is-vcentered is-hidden-mobile" id="cu-identity">
        <div class="column" id="cu-logo">
          <a href="https://www.cornell.edu/"><img src="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg" alt="Cornell University"></a>
        </div><div class="column" id="support-ack">
          <span id="support-ack-url">We gratefully acknowledge support from the Simons Foundation, <a href="https://info.arxiv.org/about/ourmembers.html">member institutions</a>, and all contributors.</span>
          <a
href="https://info.arxiv.org/about/donate.html" class="btn-header-donate">Donate</a>
        </div>
      </div>

      <!-- Desktop header (carries the is-hidden-mobile class): breadcrumb trail
           and the mini search form. The breadcrumb separator is an escaped
           greater-than sign. -->
      <div id="header" class="is-hidden-mobile">
        <!-- NOTE(review): empty, aria-hidden, unfocusable link; looks like a crawler trap. Confirm before changing it. -->
        <a aria-hidden="true" tabindex="-1" href="/IgnoreMe"></a>
        <div class="header-breadcrumbs">
          <a href="/"><img src="/static/browse/0.3.4/images/arxiv-logo-one-color-white.svg" alt="arxiv logo" style="height:40px;"></a>
          <span>&gt;</span>
          <a href="/list/cs.CV/recent">cs.CV</a>
        </div>
        <div class="search-block level-right">
          <!-- GET form: submits query, searchtype and a hidden source=header field to arxiv.org/search. -->
          <form class="level-item mini-search" method="GET" action="https://arxiv.org/search">
            <div class="field has-addons">
              <div class="control">
                <input class="input is-small" type="text" name="query" placeholder="Search..." aria-label="Search term or terms">
                <p class="help"><a href="https://info.arxiv.org/help">Help</a> | <a href="https://arxiv.org/search/advanced">Advanced Search</a></p>
              </div>
              <div class="control">
                <div class="select is-small">
                  <select name="searchtype" aria-label="Field to search">
                    <option value="all" selected>All fields</option>
                    <option value="title">Title</option>
                    <option value="author">Author</option>
                    <option value="abstract">Abstract</option>
                    <option value="comments">Comments</option>
                    <option value="journal_ref">Journal reference</option>
                    <option value="acm_class">ACM classification</option>
                    <option value="msc_class">MSC classification</option>
                    <option value="report_num">Report number</option>
                    <option value="paper_id">arXiv identifier</option>
                    <option value="doi">DOI</option>
                    <option value="orcid">ORCID</option>
                    <option value="author_id">arXiv author ID</option>
                    <option value="help">Help pages</option>
                    <option value="full_text">Full text</option>
                  </select>
                </div>
              </div>
              <input type="hidden" name="source" value="header">
              <button type="submit" class="button is-small is-cul-darker">Search</button>
            </div>
          </form>
        </div>
      </div>

      <!-- Mobile header: logos first, toggle controls follow. -->
      <div class="mobile-header">
        <div class="columns is-mobile">
          <div class="column logo-arxiv"><a href="https://arxiv.org/"><img
src="/static/browse/0.3.4/images/arxiv-logomark-small-white.svg" alt="arXiv logo" style="height:60px;"></a></div>
          <!-- Cornell logo with two alternative sources.
               NOTE(review): sizes="400w" is not a valid source size (a CSS length
               is expected there). Each srcset lists a single candidate, so the
               value is left as it was; confirm the intended width before changing it. -->
          <div class="column logo-cornell"><a href="https://www.cornell.edu/">
            <picture>
              <source media="(min-width: 501px)" srcset="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg 400w" sizes="400w">
              <source srcset="/static/browse/0.3.4/images/icons/cu/cornell_seal_simple_black.svg 2x">
              <img src="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg" alt="Cornell University Logo">
            </picture>
          </a></div>
          <!-- Toggle container. It carries no ARIA menubar role: its children are
               plain buttons and panels, not menuitems. -->
          <div class="column nav" id="toggle-container">
            <!-- Search toggle: icon-only button; the SVG title supplies its text alternative. -->
            <button type="button" class="toggle-control"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-white"><title>open search</title><path d="M505 442.7L405.3 343c-4.5-4.5-10.6-7-17-7H372c27.6-35.3 44-79.7 44-128C416 93.1 322.9 0 208 0S0 93.1 0 208s93.1 208 208 208c48.3 0 92.7-16.4 128-44v16.3c0 6.4 2.5 12.5 7 17l99.7 99.7c9.4 9.4 24.6 9.4 33.9 0l28.3-28.3c9.4-9.4 9.4-24.6.1-34zM208 336c-70.7 0-128-57.2-128-128 0-70.7 57.2-128 128-128 70.7 0 128 57.2 128 128 0 70.7-57.2 128-128 128z"/></svg></button>
            <div class="mobile-toggle-block toggle-target">
              <form class="mobile-search-form" method="GET" action="https://arxiv.org/search">
                <div class="field has-addons">
                  <input class="input" type="text" name="query" placeholder="Search..."
aria-label="Search term or terms">
                  <input type="hidden" name="source" value="header">
                  <input type="hidden" name="searchtype" value="all">
                  <button type="submit" class="button">GO</button>
                </div>
              </form>
            </div>
            <!-- Navigation toggle: icon-only button; the SVG title supplies its text alternative. -->
            <button type="button" class="toggle-control"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512" class="icon filter-white"><title>open navigation menu</title><path d="M16 132h416c8.837 0 16-7.163 16-16V76c0-8.837-7.163-16-16-16H16C7.163 60 0 67.163 0 76v40c0 8.837 7.163 16 16 16zm0 160h416c8.837 0 16-7.163 16-16v-40c0-8.837-7.163-16-16-16H16c-8.837 0-16 7.163-16 16v40c0 8.837 7.163 16 16 16zm0 160h416c8.837 0 16-7.163 16-16v-40c0-8.837-7.163-16-16-16H16c-8.837 0-16 7.163-16 16v40c0 8.837 7.163 16 16 16z"/></svg></button>
            <div class="mobile-toggle-block toggle-target">
              <nav class="mobile-menu" aria-labelledby="mobilemenulabel">
                <h2 id="mobilemenulabel">quick links</h2>
                <ul>
                  <li><a href="https://arxiv.org/login">Login</a></li>
                  <li><a href="https://info.arxiv.org/help">Help Pages</a></li>
                  <li><a href="https://info.arxiv.org/about">About</a></li>
                </ul>
              </nav>
            </div>
          </div>
        </div>
      </div>
    </header>
    <main>
      <!-- #content is the target of the skip link at the top of the page. -->
      <div id="content">
        <div id="content-inner">
          <div id="dlpage">
            <h1>Computer Vision and Pattern Recognition</h1>
            <h2>Authors and titles for recent submissions</h2>
            <!-- Per-day jump list; each link sets the skip offset for that day.
                 Adjacent list items are kept free of whitespace between them, as in the original markup. -->
            <ul>
              <li> <a href="/list/cs.CV/recent?skip=0&amp;show=50"> Fri, 21 Mar 2025 </a> </li><li>
                <a href="/list/cs.CV/recent?skip=153&amp;show=50"> Thu, 20 Mar 2025 </a> </li><li>
                <a href="/list/cs.CV/recent?skip=314&amp;show=50"> Wed, 19 Mar 2025 </a> </li><li>
                <a href="/list/cs.CV/recent?skip=486&amp;show=50"> Tue, 18 Mar 2025 </a> </li><li>
                <a href="/list/cs.CV/recent?skip=814&amp;show=50"> Mon, 17 Mar 2025 </a> </li></ul>
            <p>See today's <a id="new-cs.CV" aria-labelledby="new-cs.CV" href="/list/cs.CV/new">new</a> changes</p>
            <!-- Pager: the current range is a plain span, the other ranges are links.
                 Attribute values are quoted and ampersands in query strings are escaped. -->
            <div class="paging">Total of 993 entries :
              <span>1-50</span>
              <a href="/list/cs.CV/recent?skip=50&amp;show=50">51-100</a>
              <a href="/list/cs.CV/recent?skip=100&amp;show=50">101-150</a>
              <a
href="/list/cs.CV/recent?skip=150&amp;show=50">151-200</a>
              <span>...</span>
              <a href="/list/cs.CV/recent?skip=950&amp;show=50">951-993</a>
            </div>
            <!-- Page-size switcher: same listing with show=25, 100 or 2000; links are rel="nofollow". -->
            <div class="morefewer">Showing up to 50 entries per page:
              <a href="/list/cs.CV/recent?skip=0&amp;show=25" rel="nofollow"> fewer</a> |
              <a href="/list/cs.CV/recent?skip=0&amp;show=100" rel="nofollow"> more</a> |
              <a href="/list/cs.CV/recent?skip=0&amp;show=2000" rel="nofollow"> all</a>
            </div>
            <!-- Article list: each record is a dt (number, abstract link, format links)
                 followed by a dd (title, authors, optional comments, subjects).
                 NOTE(review): a heading is not a permitted direct child of dl; moving the
                 h3 needs the whole list, so the record markup below is left unchanged. -->
            <dl id='articles'>
              <h3>Fri, 21 Mar 2025 (showing first 50 of 153 entries )</h3>
              <dt>
                <a name='item1'>[1]</a>
                <a href ="/abs/2503.16430" title="Abstract" id="2503.16430"> arXiv:2503.16430 </a>
                [<a href="/pdf/2503.16430" title="Download PDF" id="pdf-2503.16430" aria-labelledby="pdf-2503.16430">pdf</a>, <a href="https://arxiv.org/html/2503.16430v1" title="View HTML" id="html-2503.16430" aria-labelledby="html-2503.16430" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16430" title="Other formats" id="oth-2503.16430" aria-labelledby="oth-2503.16430">other</a>]
              </dt>
              <dd>
                <div class='meta'>
                  <div class='list-title mathjax'><span class='descriptor'>Title:</span> Bridging Continuous and Discrete Tokens for Autoregressive Visual Generation </div>
                  <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+Y">Yuqing Wang</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Lin,+Z">Zhijie Lin</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Teng,+Y">Yao Teng</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhu,+Y">Yuanzhi Zhu</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Ren,+S">Shuhuai Ren</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Feng,+J">Jiashi Feng</a>,
                    <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+X">Xihui Liu</a></div>
                  <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://yuqingwang1029.github.io/TokenBridge" rel="external noopener nofollow"
class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item2'>[2]</a> <a href ="/abs/2503.16429" title="Abstract" id="2503.16429"> arXiv:2503.16429 </a> [<a href="/pdf/2503.16429" title="Download PDF" id="pdf-2503.16429" aria-labelledby="pdf-2503.16429">pdf</a>, <a href="https://arxiv.org/html/2503.16429v1" title="View HTML" id="html-2503.16429" aria-labelledby="html-2503.16429" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16429" title="Other formats" id="oth-2503.16429" aria-labelledby="oth-2503.16429">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Sonata: Self-Supervised Learning of Reliable Point Representations </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+X">Xiaoyang Wu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=DeTone,+D">Daniel DeTone</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Frost,+D">Duncan Frost</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shen,+T">Tianwei Shen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xie,+C">Chris Xie</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+N">Nan Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Engel,+J">Jakob Engel</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Newcombe,+R">Richard Newcombe</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+H">Hengshuang Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Straub,+J">Julian Straub</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> CVPR 2025, produced by Pointcept x Meta, project page: <a href="https://xywu.me/sonata/" 
rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item3'>[3]</a> <a href ="/abs/2503.16426" title="Abstract" id="2503.16426"> arXiv:2503.16426 </a> [<a href="/pdf/2503.16426" title="Download PDF" id="pdf-2503.16426" aria-labelledby="pdf-2503.16426">pdf</a>, <a href="https://arxiv.org/html/2503.16426v1" title="View HTML" id="html-2503.16426" aria-labelledby="html-2503.16426" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16426" title="Other formats" id="oth-2503.16426" aria-labelledby="oth-2503.16426">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> DynamicVis: An Efficient and General Visual Foundation Model for Remote Sensing Image Understanding </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+K">Keyan Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+C">Chenyang Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+B">Bowen Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+W">Wenyuan Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zou,+Z">Zhengxia Zou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shi,+Z">Zhenwei Shi</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item4'>[4]</a> <a href ="/abs/2503.16425" title="Abstract" id="2503.16425"> arXiv:2503.16425 </a> [<a href="/pdf/2503.16425" title="Download PDF" id="pdf-2503.16425" aria-labelledby="pdf-2503.16425">pdf</a>, <a href="https://arxiv.org/html/2503.16425v1" title="View HTML" 
id="html-2503.16425" aria-labelledby="html-2503.16425" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16425" title="Other formats" id="oth-2503.16425" aria-labelledby="oth-2503.16425">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Tokenize Image as a Set </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Geng,+Z">Zigang Geng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xu,+M">Mengde Xu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Hu,+H">Han Hu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gu,+S">Shuyang Gu</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item5'>[5]</a> <a href ="/abs/2503.16423" title="Abstract" id="2503.16423"> arXiv:2503.16423 </a> [<a href="/pdf/2503.16423" title="Download PDF" id="pdf-2503.16423" aria-labelledby="pdf-2503.16423">pdf</a>, <a href="https://arxiv.org/html/2503.16423v1" title="View HTML" id="html-2503.16423" aria-labelledby="html-2503.16423" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16423" title="Other formats" id="oth-2503.16423" aria-labelledby="oth-2503.16423">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> GAEA: A Geolocation Aware Conversational Model </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Campos,+R">Ron Campos</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Vayani,+A">Ashmal Vayani</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kulkarni,+P+P">Parth Parag Kulkarni</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gupta,+R">Rohit Gupta</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Dutta,+A">Aritra Dutta</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shah,+M">Mubarak Shah</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> The dataset and code used in this submission is available at: <a href="https://ucf-crcv.github.io/GAEA/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item6'>[6]</a> <a href ="/abs/2503.16422" title="Abstract" id="2503.16422"> arXiv:2503.16422 </a> [<a href="/pdf/2503.16422" title="Download PDF" id="pdf-2503.16422" aria-labelledby="pdf-2503.16422">pdf</a>, <a href="https://arxiv.org/html/2503.16422v1" title="View HTML" id="html-2503.16422" aria-labelledby="html-2503.16422" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16422" title="Other formats" id="oth-2503.16422" aria-labelledby="oth-2503.16422">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> 1000+ FPS 4D Gaussian Splatting for Dynamic Scene Rendering </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Yuan,+Y">Yuheng Yuan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shen,+Q">Qiuhong Shen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+X">Xingyi Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+X">Xinchao Wang</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item7'>[7]</a> <a href ="/abs/2503.16421" title="Abstract" id="2503.16421"> arXiv:2503.16421 </a> [<a 
href="/pdf/2503.16421" title="Download PDF" id="pdf-2503.16421" aria-labelledby="pdf-2503.16421">pdf</a>, <a href="https://arxiv.org/html/2503.16421v1" title="View HTML" id="html-2503.16421" aria-labelledby="html-2503.16421" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16421" title="Other formats" id="oth-2503.16421" aria-labelledby="oth-2503.16421">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> MagicMotion: Controllable Video Generation with Dense-to-Sparse Trajectory Guidance </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+Q">Quanhao Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xing,+Z">Zhen Xing</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+R">Rui Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+H">Hui Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Dai,+Q">Qi Dai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+Z">Zuxuan Wu</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item8'>[8]</a> <a href ="/abs/2503.16420" title="Abstract" id="2503.16420"> arXiv:2503.16420 </a> [<a href="/pdf/2503.16420" title="Download PDF" id="pdf-2503.16420" aria-labelledby="pdf-2503.16420">pdf</a>, <a href="https://arxiv.org/html/2503.16420v1" title="View HTML" id="html-2503.16420" aria-labelledby="html-2503.16420" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16420" title="Other formats" id="oth-2503.16420" aria-labelledby="oth-2503.16420">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> SynCity: 
Training-Free Generation of 3D Worlds </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Engstler,+P">Paul Engstler</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shtedritski,+A">Aleksandar Shtedritski</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Laina,+I">Iro Laina</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Rupprecht,+C">Christian Rupprecht</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Vedaldi,+A">Andrea Vedaldi</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://research.paulengstler.com/syncity/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item9'>[9]</a> <a href ="/abs/2503.16418" title="Abstract" id="2503.16418"> arXiv:2503.16418 </a> [<a href="/pdf/2503.16418" title="Download PDF" id="pdf-2503.16418" aria-labelledby="pdf-2503.16418">pdf</a>, <a href="https://arxiv.org/html/2503.16418v1" title="View HTML" id="html-2503.16418" aria-labelledby="html-2503.16418" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16418" title="Other formats" id="oth-2503.16418" aria-labelledby="oth-2503.16418">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> InfiniteYou: Flexible Photo Recrafting While Preserving Your Identity </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Jiang,+L">Liming Jiang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yan,+Q">Qing Yan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jia,+Y">Yumin Jia</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+Z">Zichuan Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kang,+H">Hao Kang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lu,+X">Xin Lu</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://bytedance.github.io/InfiniteYou/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> Code and model: <a href="https://github.com/bytedance/InfiniteYou" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item10'>[10]</a> <a href ="/abs/2503.16413" title="Abstract" id="2503.16413"> arXiv:2503.16413 </a> [<a href="/pdf/2503.16413" title="Download PDF" id="pdf-2503.16413" aria-labelledby="pdf-2503.16413">pdf</a>, <a href="https://arxiv.org/html/2503.16413v1" title="View HTML" id="html-2503.16413" aria-labelledby="html-2503.16413" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16413" title="Other formats" id="oth-2503.16413" aria-labelledby="oth-2503.16413">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> M3: 3D-Spatial MultiModal Memory </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Zou,+X">Xueyan Zou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Song,+Y">Yuchen Song</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Qiu,+R">Ri-Zhao Qiu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Peng,+X">Xuanbin Peng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ye,+J">Jianglong Ye</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+S">Sifei Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+X">Xiaolong Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> ICLR2025 homepage: <a href="https://m3-spatial-memory.github.io" rel="external noopener nofollow" class="link-external link-https">this https URL</a> code: <a href="https://github.com/MaureenZOU/m3-spatial" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Robotics (cs.RO) </div> </div> </dd> <dt> <a name='item11'>[11]</a> <a href ="/abs/2503.16412" title="Abstract" id="2503.16412"> arXiv:2503.16412 </a> [<a href="/pdf/2503.16412" title="Download PDF" id="pdf-2503.16412" aria-labelledby="pdf-2503.16412">pdf</a>, <a href="https://arxiv.org/html/2503.16412v1" title="View HTML" id="html-2503.16412" aria-labelledby="html-2503.16412" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16412" title="Other formats" id="oth-2503.16412" aria-labelledby="oth-2503.16412">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> DreamTexture: Shape from Virtual Texture with Analysis by Augmentation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Bhattarai,+A+R">Ananta R. 
Bhattarai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=He,+X">Xingzhe He</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sheffer,+A">Alla Sheffer</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Rhodin,+H">Helge Rhodin</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://anantarb.github.io/dreamtexture/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item12'>[12]</a> <a href ="/abs/2503.16399" title="Abstract" id="2503.16399"> arXiv:2503.16399 </a> [<a href="/pdf/2503.16399" title="Download PDF" id="pdf-2503.16399" aria-labelledby="pdf-2503.16399">pdf</a>, <a href="https://arxiv.org/html/2503.16399v1" title="View HTML" id="html-2503.16399" aria-labelledby="html-2503.16399" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16399" title="Other formats" id="oth-2503.16399" aria-labelledby="oth-2503.16399">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> SA-Occ: Satellite-Assisted 3D Occupancy Prediction in Real World </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+C">Chen Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+Z">Zhirui Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sheng,+T">Taowei Sheng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jiang,+Y">Yi Jiang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+Y">Yundu Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Cheng,+P">Peirui Cheng</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+L">Luning Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+K">Kaiqiang Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Hu,+Y">Yanfeng Hu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+X">Xue Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sun,+X">Xian Sun</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 10 pages </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI) </div> </div> </dd> <dt> <a name='item13'>[13]</a> <a href ="/abs/2503.16397" title="Abstract" id="2503.16397"> arXiv:2503.16397 </a> [<a href="/pdf/2503.16397" title="Download PDF" id="pdf-2503.16397" aria-labelledby="pdf-2503.16397">pdf</a>, <a href="https://arxiv.org/html/2503.16397v1" title="View HTML" id="html-2503.16397" aria-labelledby="html-2503.16397" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16397" title="Other formats" id="oth-2503.16397" aria-labelledby="oth-2503.16397">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Scale-wise Distillation of Diffusion Models </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Starodubcev,+N">Nikita Starodubcev</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kuznedelev,+D">Denis Kuznedelev</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Babenko,+A">Artem Babenko</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Baranchuk,+D">Dmitry Baranchuk</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a 
name='item14'>[14]</a> <a href ="/abs/2503.16396" title="Abstract" id="2503.16396"> arXiv:2503.16396 </a> [<a href="/pdf/2503.16396" title="Download PDF" id="pdf-2503.16396" aria-labelledby="pdf-2503.16396">pdf</a>, <a href="https://arxiv.org/html/2503.16396v1" title="View HTML" id="html-2503.16396" aria-labelledby="html-2503.16396" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16396" title="Other formats" id="oth-2503.16396" aria-labelledby="oth-2503.16396">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> SV4D 2.0: Enhancing Spatio-Temporal Consistency in Multi-View Video Diffusion for High-Quality 4D Generation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Yao,+C">Chun-Han Yao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xie,+Y">Yiming Xie</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Voleti,+V">Vikram Voleti</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jiang,+H">Huaizu Jiang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jampani,+V">Varun Jampani</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item15'>[15]</a> <a href ="/abs/2503.16394" title="Abstract" id="2503.16394"> arXiv:2503.16394 </a> [<a href="/pdf/2503.16394" title="Download PDF" id="pdf-2503.16394" aria-labelledby="pdf-2503.16394">pdf</a>, <a href="https://arxiv.org/html/2503.16394v1" title="View HTML" id="html-2503.16394" aria-labelledby="html-2503.16394" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16394" title="Other formats" id="oth-2503.16394" aria-labelledby="oth-2503.16394">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Do Visual 
Imaginations Improve Vision-and-Language Navigation Agents? </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Perincherry,+A">Akhil Perincherry</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Krantz,+J">Jacob Krantz</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lee,+S">Stefan Lee</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Computation and Language (cs.CL); Robotics (cs.RO) </div> </div> </dd> <dt> <a name='item16'>[16]</a> <a href ="/abs/2503.16378" title="Abstract" id="2503.16378"> arXiv:2503.16378 </a> [<a href="/pdf/2503.16378" title="Download PDF" id="pdf-2503.16378" aria-labelledby="pdf-2503.16378">pdf</a>, <a href="https://arxiv.org/html/2503.16378v1" title="View HTML" id="html-2503.16378" aria-labelledby="html-2503.16378" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16378" title="Other formats" id="oth-2503.16378" aria-labelledby="oth-2503.16378">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Panoptic-CUDAL Technical Report: Rural Australia Point Cloud Dataset in Rainy Conditions </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Tseng,+T">Tzu-Yun Tseng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nekrasov,+A">Alexey Nekrasov</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Burdorf,+M">Malcolm Burdorf</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Leibe,+B">Bastian Leibe</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Berrio,+J+S">Julie Stephany Berrio</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shan,+M">Mao Shan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Worrall,+S">Stewart 
Worrall</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item17'>[17]</a> <a href ="/abs/2503.16376" title="Abstract" id="2503.16376"> arXiv:2503.16376 </a> [<a href="/pdf/2503.16376" title="Download PDF" id="pdf-2503.16376" aria-labelledby="pdf-2503.16376">pdf</a>, <a href="https://arxiv.org/html/2503.16376v1" title="View HTML" id="html-2503.16376" aria-labelledby="html-2503.16376" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16376" title="Other formats" id="oth-2503.16376" aria-labelledby="oth-2503.16376">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> LaPIG: Cross-Modal Generation of Paired Thermal and Visible Facial Images </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+L">Leyang Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lin,+J">Joice Lin</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item18'>[18]</a> <a href ="/abs/2503.16375" title="Abstract" id="2503.16375"> arXiv:2503.16375 </a> [<a href="/pdf/2503.16375" title="Download PDF" id="pdf-2503.16375" aria-labelledby="pdf-2503.16375">pdf</a>, <a href="https://arxiv.org/html/2503.16375v1" title="View HTML" id="html-2503.16375" aria-labelledby="html-2503.16375" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16375" title="Other formats" id="oth-2503.16375" aria-labelledby="oth-2503.16375">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> NuiScene: Exploring Efficient Generation of Unbounded Outdoor Scenes </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Lee,+H">Han-Hung Lee</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Han,+Q">Qinghong Han</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chang,+A+X">Angel X. Chang</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item19'>[19]</a> <a href ="/abs/2503.16365" title="Abstract" id="2503.16365"> arXiv:2503.16365 </a> [<a href="/pdf/2503.16365" title="Download PDF" id="pdf-2503.16365" aria-labelledby="pdf-2503.16365">pdf</a>, <a href="https://arxiv.org/html/2503.16365v1" title="View HTML" id="html-2503.16365" aria-labelledby="html-2503.16365" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16365" title="Other formats" id="oth-2503.16365" aria-labelledby="oth-2503.16365">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> JARVIS-VLA: Post-Training Large-Scale Vision Language Models to Play Visual Games with Keyboards and Mouse </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+M">Muyao Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+Z">Zihao Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=He,+K">Kaichen He</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ma,+X">Xiaojian Ma</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liang,+Y">Yitao Liang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 22 pages, 5 figures </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI) </div> </div> </dd> <dt> <a name='item20'>[20]</a> <a href ="/abs/2503.16357" 
title="Abstract" id="2503.16357"> arXiv:2503.16357 </a> [<a href="/pdf/2503.16357" title="Download PDF" id="pdf-2503.16357" aria-labelledby="pdf-2503.16357">pdf</a>, <a href="https://arxiv.org/html/2503.16357v1" title="View HTML" id="html-2503.16357" aria-labelledby="html-2503.16357" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16357" title="Other formats" id="oth-2503.16357" aria-labelledby="oth-2503.16357">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> UniSync: A Unified Framework for Audio-Visual Synchronization </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Feng,+T">Tao Feng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xie,+Y">Yifan Xie</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Guan,+X">Xun Guan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Song,+J">Jiyuan Song</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+Z">Zhou Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ma,+F">Fei Ma</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yu,+F">Fei Yu</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 7 pages, 3 figures, accepted by ICME 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Sound (cs.SD); Audio and Speech Processing (eess.AS) </div> </div> </dd> <dt> <a name='item21'>[21]</a> <a href ="/abs/2503.16338" title="Abstract" id="2503.16338"> arXiv:2503.16338 </a> [<a href="/pdf/2503.16338" title="Download PDF" id="pdf-2503.16338" aria-labelledby="pdf-2503.16338">pdf</a>, <a href="https://arxiv.org/html/2503.16338v1" title="View HTML" id="html-2503.16338" aria-labelledby="html-2503.16338" rel="noopener noreferrer" target="_blank">html</a>, <a 
href="/format/2503.16338" title="Other formats" id="oth-2503.16338" aria-labelledby="oth-2503.16338">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Gaussian Graph Network: Learning Efficient and Generalizable Gaussian Representations from Multi-view Images </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+S">Shengjun Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Fei,+X">Xin Fei</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+F">Fangfu Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Song,+H">Haixu Song</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Duan,+Y">Yueqi Duan</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> NeurIPS 2024 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item22'>[22]</a> <a href ="/abs/2503.16322" title="Abstract" id="2503.16322"> arXiv:2503.16322 </a> [<a href="/pdf/2503.16322" title="Download PDF" id="pdf-2503.16322" aria-labelledby="pdf-2503.16322">pdf</a>, <a href="https://arxiv.org/html/2503.16322v1" title="View HTML" id="html-2503.16322" aria-labelledby="html-2503.16322" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16322" title="Other formats" id="oth-2503.16322" aria-labelledby="oth-2503.16322">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Ultra-Resolution Adaptation with Ease </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Yu,+R">Ruonan Yu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+S">Songhua Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Tan,+Z">Zhenxiong Tan</a>, 
<a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+X">Xinchao Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Technical Report. Codes are available at <a href="https://github.com/Huage001/URAE" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item23'>[23]</a> <a href ="/abs/2503.16318" title="Abstract" id="2503.16318"> arXiv:2503.16318 </a> [<a href="/pdf/2503.16318" title="Download PDF" id="pdf-2503.16318" aria-labelledby="pdf-2503.16318">pdf</a>, <a href="https://arxiv.org/html/2503.16318v1" title="View HTML" id="html-2503.16318" aria-labelledby="html-2503.16318" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16318" title="Other formats" id="oth-2503.16318" aria-labelledby="oth-2503.16318">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Dynamic Point Maps: A Versatile Representation for Dynamic 3D Reconstruction </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Sucar,+E">Edgar Sucar</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lai,+Z">Zihang Lai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Insafutdinov,+E">Eldar Insafutdinov</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Vedaldi,+A">Andrea Vedaldi</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Web page: <a href="https://www.robots.ox.ac.uk/~vgg/research/dynamic-point-maps/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and 
Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item24'>[24]</a> <a href ="/abs/2503.16302" title="Abstract" id="2503.16302"> arXiv:2503.16302 </a> [<a href="/pdf/2503.16302" title="Download PDF" id="pdf-2503.16302" aria-labelledby="pdf-2503.16302">pdf</a>, <a href="https://arxiv.org/html/2503.16302v1" title="View HTML" id="html-2503.16302" aria-labelledby="html-2503.16302" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16302" title="Other formats" id="oth-2503.16302" aria-labelledby="oth-2503.16302">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Unleashing Vecset Diffusion Model for Fast Shape Generation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Lai,+Z">Zeqiang Lai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+Y">Yunfei Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+Z">Zibo Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+H">Haolin Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+F">Fuyun Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shi,+H">Huiwen Shi</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+X">Xianghui Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lin,+Q">Qinxiang Lin</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Huang,+J">Jinwei Huang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+Y">Yuhong Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jiang,+J">Jie Jiang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+C">Chunchao Guo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yue,+X">Xiangyu Yue</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Technical report </div> <div 
class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Image and Video Processing (eess.IV) </div> </div> </dd> <dt> <a name='item25'>[25]</a> <a href ="/abs/2503.16289" title="Abstract" id="2503.16289"> arXiv:2503.16289 </a> [<a href="/pdf/2503.16289" title="Download PDF" id="pdf-2503.16289" aria-labelledby="pdf-2503.16289">pdf</a>, <a href="https://arxiv.org/html/2503.16289v1" title="View HTML" id="html-2503.16289" aria-labelledby="html-2503.16289" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16289" title="Other formats" id="oth-2503.16289" aria-labelledby="oth-2503.16289">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> SceneMI: Motion In-betweening for Modeling Human-Scene Interactions </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Hwang,+I">Inwoo Hwang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhou,+B">Bing Zhou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kim,+Y+M">Young Min Kim</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+J">Jian Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+C">Chuan Guo</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 15 pages, Project page: <a href="http://inwoohwang.me/SceneMI" rel="external noopener nofollow" class="link-external link-http">this http URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item26'>[26]</a> <a href ="/abs/2503.16284" title="Abstract" id="2503.16284"> arXiv:2503.16284 </a> [<a href="/pdf/2503.16284" title="Download PDF" id="pdf-2503.16284" 
aria-labelledby="pdf-2503.16284">pdf</a>, <a href="https://arxiv.org/html/2503.16284v1" title="View HTML" id="html-2503.16284" aria-labelledby="html-2503.16284" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16284" title="Other formats" id="oth-2503.16284" aria-labelledby="oth-2503.16284">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> PSA-MIL: A Probabilistic Spatial Attention-Based Multiple Instance Learning for Whole Slide Image Classification </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Peled,+S">Sharon Peled</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Maruvka,+Y+E">Yosef E. Maruvka</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Freiman,+M">Moti Freiman</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 8 pages, 7 figures </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item27'>[27]</a> <a href ="/abs/2503.16282" title="Abstract" id="2503.16282"> arXiv:2503.16282 </a> [<a href="/pdf/2503.16282" title="Download PDF" id="pdf-2503.16282" aria-labelledby="pdf-2503.16282">pdf</a>, <a href="https://arxiv.org/html/2503.16282v1" title="View HTML" id="html-2503.16282" aria-labelledby="html-2503.16282" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16282" title="Other formats" id="oth-2503.16282" aria-labelledby="oth-2503.16282">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Generalized Few-shot 3D Point Cloud Segmentation with Vision-Language Model </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=An,+Z">Zhaochong An</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Sun,+G">Guolei Sun</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+Y">Yun Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+R">Runjia Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Han,+J">Junlin Han</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Konukoglu,+E">Ender Konukoglu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Belongie,+S">Serge Belongie</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted to CVPR 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item28'>[28]</a> <a href ="/abs/2503.16263" title="Abstract" id="2503.16263"> arXiv:2503.16263 </a> [<a href="/pdf/2503.16263" title="Download PDF" id="pdf-2503.16263" aria-labelledby="pdf-2503.16263">pdf</a>, <a href="https://arxiv.org/html/2503.16263v1" title="View HTML" id="html-2503.16263" aria-labelledby="html-2503.16263" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16263" title="Other formats" id="oth-2503.16263" aria-labelledby="oth-2503.16263">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> From Monocular Vision to Autonomous Action: Guiding Tumor Resection via 3D Reconstruction </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Acar,+A">Ayberk Acar</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Smith,+M">Mariana Smith</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Al-Zogbi,+L">Lidia Al-Zogbi</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Watts,+T">Tanner Watts</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+F">Fangjie Li</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Li,+H">Hao Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yilmaz,+N">Nural Yilmaz</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Scheikl,+P+M">Paul Maria Scheikl</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=d'Almeida,+J+F">Jesse F. d'Almeida</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sharma,+S">Susheela Sharma</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Branscombe,+L">Lauren Branscombe</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ertop,+T+E">Tayfun Efe Ertop</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Webster,+R+J">Robert J. Webster III</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Oguz,+I">Ipek Oguz</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kuntz,+A">Alan Kuntz</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Krieger,+A">Axel Krieger</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+J+Y">Jie Ying Wu</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 7 Pages, 8 Figures, 1 Table. 
This work has been submitted to the IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS) for possible publication </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Robotics (cs.RO) </div> </div> </dd> <dt> <a name='item29'>[29]</a> <a href ="/abs/2503.16260" title="Abstract" id="2503.16260"> arXiv:2503.16260 </a> [<a href="/pdf/2503.16260" title="Download PDF" id="pdf-2503.16260" aria-labelledby="pdf-2503.16260">pdf</a>, <a href="https://arxiv.org/html/2503.16260v1" title="View HTML" id="html-2503.16260" aria-labelledby="html-2503.16260" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16260" title="Other formats" id="oth-2503.16260" aria-labelledby="oth-2503.16260">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Chain of Functions: A Programmatic Pipeline for Fine-Grained Chart Reasoning Data </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+Z">Zijian Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Fu,+J">Jingjing Fu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Song,+L">Lei Song</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Bian,+J">Jiang Bian</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+J">Jun Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+R">Rui Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Under review </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item30'>[30]</a> <a href ="/abs/2503.16257" title="Abstract" id="2503.16257"> arXiv:2503.16257 </a> [<a href="/pdf/2503.16257" title="Download PDF" 
id="pdf-2503.16257" aria-labelledby="pdf-2503.16257">pdf</a>, <a href="https://arxiv.org/html/2503.16257v1" title="View HTML" id="html-2503.16257" aria-labelledby="html-2503.16257" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16257" title="Other formats" id="oth-2503.16257" aria-labelledby="oth-2503.16257">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Plug-and-Play 1.x-Bit KV Cache Quantization for Video Large Language Models </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Tao,+K">Keda Tao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=You,+H">Haoxuan You</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sui,+Y">Yang Sui</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Qin,+C">Can Qin</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+H">Huan Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 12 pages </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item31'>[31]</a> <a href ="/abs/2503.16254" title="Abstract" id="2503.16254"> arXiv:2503.16254 </a> [<a href="/pdf/2503.16254" title="Download PDF" id="pdf-2503.16254" aria-labelledby="pdf-2503.16254">pdf</a>, <a href="https://arxiv.org/html/2503.16254v1" title="View HTML" id="html-2503.16254" aria-labelledby="html-2503.16254" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16254" title="Other formats" id="oth-2503.16254" aria-labelledby="oth-2503.16254">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> M2N2V2: Multi-Modal Unsupervised and Training-free Interactive Segmentation </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Karmann,+M">Markus Karmann</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jiang,+P">Peng-Tao Jiang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+B">Bo Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Urfalioglu,+O">Onay Urfalioglu</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item32'>[32]</a> <a href ="/abs/2503.16247" title="Abstract" id="2503.16247"> arXiv:2503.16247 </a> [<a href="/pdf/2503.16247" title="Download PDF" id="pdf-2503.16247" aria-labelledby="pdf-2503.16247">pdf</a>, <a href="https://arxiv.org/html/2503.16247v1" title="View HTML" id="html-2503.16247" aria-labelledby="html-2503.16247" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16247" title="Other formats" id="oth-2503.16247" aria-labelledby="oth-2503.16247">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> OpenMIBOOD: Open Medical Imaging Benchmarks for Out-Of-Distribution Detection </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Gutbrod,+M">Max Gutbrod</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Rauber,+D">David Rauber</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nunes,+D+W">Danilo Weber Nunes</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Palm,+C">Christoph Palm</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item33'>[33]</a> <a href ="/abs/2503.16218" title="Abstract" id="2503.16218"> arXiv:2503.16218 </a> [<a href="/pdf/2503.16218" title="Download PDF" 
id="pdf-2503.16218" aria-labelledby="pdf-2503.16218">pdf</a>, <a href="https://arxiv.org/html/2503.16218v1" title="View HTML" id="html-2503.16218" aria-labelledby="html-2503.16218" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16218" title="Other formats" id="oth-2503.16218" aria-labelledby="oth-2503.16218">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Temporal Score Analysis for Understanding and Correcting Diffusion Artifacts </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Cao,+Y">Yu Cao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+Z">Zengqun Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Patras,+I">Ioannis Patras</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gong,+S">Shaogang Gong</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item34'>[34]</a> <a href ="/abs/2503.16195" title="Abstract" id="2503.16195"> arXiv:2503.16195 </a> [<a href="/pdf/2503.16195" title="Download PDF" id="pdf-2503.16195" aria-labelledby="pdf-2503.16195">pdf</a>, <a href="https://arxiv.org/html/2503.16195v1" title="View HTML" id="html-2503.16195" aria-labelledby="html-2503.16195" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16195" title="Other formats" id="oth-2503.16195" aria-labelledby="oth-2503.16195">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> VP-NTK: Exploring the Benefits of Visual Prompting in Differentially Private Data Synthesis </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Hsu,+C">Chia-Yi Hsu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+J">Jia-You Chen</a>, 
<a href="https://arxiv.org/search/cs?searchtype=author&query=Tsai,+Y">Yu-Lin Tsai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lin,+C">Chih-Hsun Lin</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+P">Pin-Yu Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yu,+C">Chia-Mu Yu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Huang,+C">Chun-Ying Huang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted by ICASSP 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item35'>[35]</a> <a href ="/abs/2503.16194" title="Abstract" id="2503.16194"> arXiv:2503.16194 </a> [<a href="/pdf/2503.16194" title="Download PDF" id="pdf-2503.16194" aria-labelledby="pdf-2503.16194">pdf</a>, <a href="https://arxiv.org/html/2503.16194v1" title="View HTML" id="html-2503.16194" aria-labelledby="html-2503.16194" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16194" title="Other formats" id="oth-2503.16194" aria-labelledby="oth-2503.16194">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Improving Autoregressive Image Generation through Coarse-to-Fine Token Prediction </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+Z">Ziyao Guo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+K">Kaipeng Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shieh,+M+Q">Michael Qizhe Shieh</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Work in progress </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition 
(cs.CV)</span> </div> </div> </dd> <dt> <a name='item36'>[36]</a> <a href ="/abs/2503.16188" title="Abstract" id="2503.16188"> arXiv:2503.16188 </a> [<a href="/pdf/2503.16188" title="Download PDF" id="pdf-2503.16188" aria-labelledby="pdf-2503.16188">pdf</a>, <a href="https://arxiv.org/html/2503.16188v1" title="View HTML" id="html-2503.16188" aria-labelledby="html-2503.16188" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16188" title="Other formats" id="oth-2503.16188" aria-labelledby="oth-2503.16188">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> CLS-RL: Image Classification with Rule-Based Reinforcement Learning </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+M">Ming Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+S">Shitian Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhong,+J">Jike Zhong</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lai,+Y">Yuxiang Lai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+K">Kaipeng Zhang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Preprint, work in progress </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item37'>[37]</a> <a href ="/abs/2503.16185" title="Abstract" id="2503.16185"> arXiv:2503.16185 </a> [<a href="/pdf/2503.16185" title="Download PDF" id="pdf-2503.16185" aria-labelledby="pdf-2503.16185">pdf</a>, <a href="/format/2503.16185" title="Other formats" id="oth-2503.16185" aria-labelledby="oth-2503.16185">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> MapGlue: Multimodal Remote Sensing Image Matching </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+P">Peihao Wu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yao,+Y">Yongxiang Yao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+W">Wenfei Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wei,+D">Dong Wei</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wan,+Y">Yi Wan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+Y">Yansheng Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+Y">Yongjun Zhang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> The dataset and code are available at <a href="https://github.com/PeihaoWu/MapGlue" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item38'>[38]</a> <a href ="/abs/2503.16184" title="Abstract" id="2503.16184"> arXiv:2503.16184 </a> [<a href="/pdf/2503.16184" title="Download PDF" id="pdf-2503.16184" aria-labelledby="pdf-2503.16184">pdf</a>, <a href="https://arxiv.org/html/2503.16184v1" title="View HTML" id="html-2503.16184" aria-labelledby="html-2503.16184" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16184" title="Other formats" id="oth-2503.16184" aria-labelledby="oth-2503.16184">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Accurate Scene Text Recognition with Efficient Model Scaling and Cloze Self-Distillation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Maracani,+A">Andrea Maracani</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ozkan,+S">Savas Ozkan</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Cho,+S">Sijun Cho</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kim,+H">Hyowon Kim</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Noh,+E">Eunchung Noh</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Min,+J">Jeongwon Min</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Min,+C+J">Cho Jung Min</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Park,+D">Dookun Park</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ozay,+M">Mete Ozay</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Computation and Language (cs.CL) </div> </div> </dd> <dt> <a name='item39'>[39]</a> <a href ="/abs/2503.16179" title="Abstract" id="2503.16179"> arXiv:2503.16179 </a> [<a href="/pdf/2503.16179" title="Download PDF" id="pdf-2503.16179" aria-labelledby="pdf-2503.16179">pdf</a>, <a href="https://arxiv.org/html/2503.16179v1" title="View HTML" id="html-2503.16179" aria-labelledby="html-2503.16179" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16179" title="Other formats" id="oth-2503.16179" aria-labelledby="oth-2503.16179">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Narrowing Class-Wise Robustness Gaps in Adversarial Training </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Amerehi,+F">Fatemeh Amerehi</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Healy,+P">Patrick Healy</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 4 figures, ICLR 2025 Workshop on Foundation Models in the Wild </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer 
Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item40'>[40]</a> <a href ="/abs/2503.16171" title="Abstract" id="2503.16171"> arXiv:2503.16171 </a> [<a href="/pdf/2503.16171" title="Download PDF" id="pdf-2503.16171" aria-labelledby="pdf-2503.16171">pdf</a>, <a href="https://arxiv.org/html/2503.16171v1" title="View HTML" id="html-2503.16171" aria-labelledby="html-2503.16171" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16171" title="Other formats" id="oth-2503.16171" aria-labelledby="oth-2503.16171">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Guardians of Generation: Dynamic Inference-Time Copyright Shielding with Adaptive Guidance for AI Image Generation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Roy,+S">Soham Roy</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Mishra,+A">Abhishek Mishra</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Karande,+S">Shirish Karande</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Mandal,+M">Murari Mandal</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item41'>[41]</a> <a href ="/abs/2503.16165" title="Abstract" id="2503.16165"> arXiv:2503.16165 </a> [<a href="/pdf/2503.16165" title="Download PDF" id="pdf-2503.16165" aria-labelledby="pdf-2503.16165">pdf</a>, <a href="https://arxiv.org/html/2503.16165v1" title="View HTML" id="html-2503.16165" aria-labelledby="html-2503.16165" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16165" title="Other formats" id="oth-2503.16165" aria-labelledby="oth-2503.16165">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span 
class='descriptor'>Title:</span> Iterative Optimal Attention and Local Model for Single Image Rain Streak Removal </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+X">Xiangyu Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Fan,+W">Wanshu Fan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shen,+Y">Yue Shen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+C">Cong Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+W">Wei Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+X">Xin Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+Q">Qiang Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhou,+D">Dongsheng Zhou</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 14 pages, 14 figures, 6 tables </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Information Retrieval (cs.IR) </div> </div> </dd> <dt> <a name='item42'>[42]</a> <a href ="/abs/2503.16153" title="Abstract" id="2503.16153"> arXiv:2503.16153 </a> [<a href="/pdf/2503.16153" title="Download PDF" id="pdf-2503.16153" aria-labelledby="pdf-2503.16153">pdf</a>, <a href="https://arxiv.org/html/2503.16153v1" title="View HTML" id="html-2503.16153" aria-labelledby="html-2503.16153" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16153" title="Other formats" id="oth-2503.16153" aria-labelledby="oth-2503.16153">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> FreeFlux: Understanding and Exploiting Layer-Specific Roles in RoPE-Based MMDiT for Versatile Image Editing </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Wei,+T">Tianyi Wei</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Zhou,+Y">Yifan Zhou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+D">Dongdong Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Pan,+X">Xingang Pan</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://wtybest.github.io/projects/FreeFlux/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item43'>[43]</a> <a href ="/abs/2503.16134" title="Abstract" id="2503.16134"> arXiv:2503.16134 </a> [<a href="/pdf/2503.16134" title="Download PDF" id="pdf-2503.16134" aria-labelledby="pdf-2503.16134">pdf</a>, <a href="/format/2503.16134" title="Other formats" id="oth-2503.16134" aria-labelledby="oth-2503.16134">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Binarized Mamba-Transformer for Lightweight Quad Bayer HybridEVS Demosaicing </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Zhou,+S">Shiyang Zhou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zeng,+H">Haijin Zeng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lu,+Y">Yunfan Lu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Shao,+T">Tong Shao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Tang,+K">Ke Tang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+Y">Yongyong Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+J">Jie Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Su,+J">Jingyong Su</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted 
by CVPR 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item44'>[44]</a> <a href ="/abs/2503.16128" title="Abstract" id="2503.16128"> arXiv:2503.16128 </a> [<a href="/pdf/2503.16128" title="Download PDF" id="pdf-2503.16128" aria-labelledby="pdf-2503.16128">pdf</a>, <a href="https://arxiv.org/html/2503.16128v1" title="View HTML" id="html-2503.16128" aria-labelledby="html-2503.16128" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16128" title="Other formats" id="oth-2503.16128" aria-labelledby="oth-2503.16128">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Coupling deep and handcrafted features to assess smile genuineness </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Pawlus,+B">Benedykt Pawlus</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Smolka,+B">Bogdan Smolka</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kawulok,+J">Jolanta Kawulok</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kawulok,+M">Michal Kawulok</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Submitted to SPIE Defense + Commercial Sensing 2024 </div> <div class='list-journal-ref'><span class='descriptor'>Journal-ref:</span> Proc. 
SPIE 13034, Real-Time Image Processing and Deep Learning 2024 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item45'>[45]</a> <a href ="/abs/2503.16125" title="Abstract" id="2503.16125"> arXiv:2503.16125 </a> [<a href="/pdf/2503.16125" title="Download PDF" id="pdf-2503.16125" aria-labelledby="pdf-2503.16125">pdf</a>, <a href="https://arxiv.org/html/2503.16125v1" title="View HTML" id="html-2503.16125" aria-labelledby="html-2503.16125" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16125" title="Other formats" id="oth-2503.16125" aria-labelledby="oth-2503.16125">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Uncertainty Meets Diversity: A Comprehensive Active Learning Framework for Indoor 3D Object Detection </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+J">Jiangyi Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+N">Na Zhao</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted by CVPR 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item46'>[46]</a> <a href ="/abs/2503.16120" title="Abstract" id="2503.16120"> arXiv:2503.16120 </a> [<a href="/pdf/2503.16120" title="Download PDF" id="pdf-2503.16120" aria-labelledby="pdf-2503.16120">pdf</a>, <a href="https://arxiv.org/html/2503.16120v1" title="View HTML" id="html-2503.16120" aria-labelledby="html-2503.16120" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16120" title="Other formats" id="oth-2503.16120" aria-labelledby="oth-2503.16120">other</a>] </dt> <dd> <div class='meta'> <div 
class='list-title mathjax'><span class='descriptor'>Title:</span> Probabilistic Prompt Distribution Learning for Animal Pose Estimation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Rao,+J">Jiyong Rao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+B+N">Brian Nlong Zhao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+Y">Yu Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted by CVPR 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item47'>[47]</a> <a href ="/abs/2503.16106" title="Abstract" id="2503.16106"> arXiv:2503.16106 </a> [<a href="/pdf/2503.16106" title="Download PDF" id="pdf-2503.16106" aria-labelledby="pdf-2503.16106">pdf</a>, <a href="https://arxiv.org/html/2503.16106v1" title="View HTML" id="html-2503.16106" aria-labelledby="html-2503.16106" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16106" title="Other formats" id="oth-2503.16106" aria-labelledby="oth-2503.16106">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> OSLoPrompt: Bridging Low-Supervision Challenges and Open-Set Domain Generalization in CLIP </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=C,+M+H+N">Mohamad Hassan N C</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gupta,+D">Divyam Gupta</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Singha,+M">Mainak Singha</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Rongali,+S+B">Sai Bhargav Rongali</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jha,+A">Ankit Jha</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Khan,+M+H">Muhammad Haris 
Khan</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Banerjee,+B">Biplab Banerjee</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Accepted to CVPR 2025 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item48'>[48]</a> <a href ="/abs/2503.16096" title="Abstract" id="2503.16096"> arXiv:2503.16096 </a> [<a href="/pdf/2503.16096" title="Download PDF" id="pdf-2503.16096" aria-labelledby="pdf-2503.16096">pdf</a>, <a href="/format/2503.16096" title="Other formats" id="oth-2503.16096" aria-labelledby="oth-2503.16096">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> MarkushGrapher: Joint Visual and Textual Recognition of Markush Structures </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Morin,+L">Lucas Morin</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Weber,+V">Valéry Weber</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nassar,+A">Ahmed Nassar</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Meijer,+G+I">Gerhard Ingmar Meijer</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Van+Gool,+L">Luc Van Gool</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+Y">Yawei Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Staar,+P">Peter Staar</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> <dt> <a name='item49'>[49]</a> <a href ="/abs/2503.16086" title="Abstract" id="2503.16086"> arXiv:2503.16086 </a> [<a href="/pdf/2503.16086" title="Download PDF" id="pdf-2503.16086" aria-labelledby="pdf-2503.16086">pdf</a>, <a 
href="https://arxiv.org/html/2503.16086v1" title="View HTML" id="html-2503.16086" aria-labelledby="html-2503.16086" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16086" title="Other formats" id="oth-2503.16086" aria-labelledby="oth-2503.16086">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Hyperspectral Imaging for Identifying Foreign Objects on Pork Belly </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Ghimpeteanu,+G">Gabriela Ghimpeteanu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Rajani,+H">Hayat Rajani</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Quintana,+J">Josep Quintana</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Garcia,+R">Rafael Garcia</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Article under review by Computers in Industry, Elsevier </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Machine Learning (cs.LG) </div> </div> </dd> <dt> <a name='item50'>[50]</a> <a href ="/abs/2503.16069" title="Abstract" id="2503.16069"> arXiv:2503.16069 </a> [<a href="/pdf/2503.16069" title="Download PDF" id="pdf-2503.16069" aria-labelledby="pdf-2503.16069">pdf</a>, <a href="https://arxiv.org/html/2503.16069v1" title="View HTML" id="html-2503.16069" aria-labelledby="html-2503.16069" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2503.16069" title="Other formats" id="oth-2503.16069" aria-labelledby="oth-2503.16069">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Disentangled and Interpretable Multimodal Attention Fusion for Cancer Survival Prediction </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Eijpe,+A">Aniek Eijpe</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Lakbir,+S">Soufyan Lakbir</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Cesur,+M+E">Melis Erdal Cesur</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Oliveira,+S+P">Sara P. Oliveira</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Abeln,+S">Sanne Abeln</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Silva,+W">Wilson Silva</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 11 pages, 1 figure, 3 tables </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span> </div> </div> </dd> </dl> <div class='paging'>Total of 993 entries : <span>1-50</span> <a href=/list/cs.CV/recent?skip=50&show=50>51-100</a> <a href=/list/cs.CV/recent?skip=100&show=50>101-150</a> <a href=/list/cs.CV/recent?skip=150&show=50>151-200</a> <span>...</span> <a href=/list/cs.CV/recent?skip=950&show=50>951-993</a> </div> <div class='morefewer'>Showing up to 50 entries per page: <a href=/list/cs.CV/recent?skip=0&show=25 rel="nofollow"> fewer</a> | <a href=/list/cs.CV/recent?skip=0&show=100 rel="nofollow"> more</a> | <a href=/list/cs.CV/recent?skip=0&show=2000 rel="nofollow"> all</a> </div> </div> </div> </div> </main> <footer style="clear: both;"> <div class="columns is-desktop" role="navigation" aria-label="Secondary" style="margin: -0.75em -0.75em 0.75em -0.75em">  <div class="column" style="padding: 0;"> <div class="columns"> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/about">About</a></li> <li><a href="https://info.arxiv.org/help">Help</a></li> </ul> </div> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li> <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" 
class="icon filter-black" role="presentation"><title>contact arXiv</title><desc>Click here to contact arXiv</desc><path d="M502.3 190.8c3.9-3.1 9.7-.2 9.7 4.7V400c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48V195.6c0-5 5.7-7.8 9.7-4.7 22.4 17.4 52.1 39.5 154.1 113.6 21.1 15.4 56.7 47.8 92.2 47.6 35.7.3 72-32.8 92.3-47.6 102-74.1 131.6-96.3 154-113.7zM256 320c23.2.4 56.6-29.2 73.4-41.4 132.7-96.3 142.8-104.7 173.4-128.7 5.8-4.5 9.2-11.5 9.2-18.9v-19c0-26.5-21.5-48-48-48H48C21.5 64 0 85.5 0 112v19c0 7.4 3.4 14.3 9.2 18.9 30.6 23.9 40.7 32.4 173.4 128.7 16.8 12.2 50.2 41.8 73.4 41.4z"/></svg> <a href="https://info.arxiv.org/help/contact.html"> Contact</a> </li> <li> <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-black" role="presentation"><title>subscribe to arXiv mailings</title><desc>Click here to subscribe</desc><path d="M476 3.2L12.5 270.6c-18.1 10.4-15.8 35.6 2.2 43.2L121 358.4l287.3-253.2c5.5-4.9 13.3 2.6 8.6 8.3L176 407v80.5c0 23.6 28.5 32.9 42.5 15.8L282 426l124.6 52.2c14.2 6 30.4-2.9 33-18.2l72-432C515 7.8 493.3-6.8 476 3.2z"/></svg> <a href="https://info.arxiv.org/help/subscribe"> Subscribe</a> </li> </ul> </div> </div> </div>   <div class="column" style="padding: 0;"> <div class="columns"> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/help/license/index.html">Copyright</a></li> <li><a href="https://info.arxiv.org/help/policies/privacy_policy.html">Privacy Policy</a></li> </ul> </div> <div class="column sorry-app-links"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/help/web_accessibility.html">Web Accessibility Assistance</a></li> <li> <p class="help"> <a class="a11y-main-link" href="https://status.arxiv.org" target="_blank">arXiv Operational Status <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 256 512" class="icon filter-dark_grey" role="presentation"><path d="M224.3 273l-136 136c-9.4 9.4-24.6 9.4-33.9 
0l-22.6-22.6c-9.4-9.4-9.4-24.6 0-33.9l96.4-96.4-96.4-96.4c-9.4-9.4-9.4-24.6 0-33.9L54.3 103c9.4-9.4 24.6-9.4 33.9 0l136 136c9.5 9.4 9.5 24.6.1 34z"/></svg></a><br> Get status notifications via <a class="is-link" href="https://subscribe.sorryapp.com/24846f03/email/new" target="_blank"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-black" role="presentation"><path d="M502.3 190.8c3.9-3.1 9.7-.2 9.7 4.7V400c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48V195.6c0-5 5.7-7.8 9.7-4.7 22.4 17.4 52.1 39.5 154.1 113.6 21.1 15.4 56.7 47.8 92.2 47.6 35.7.3 72-32.8 92.3-47.6 102-74.1 131.6-96.3 154-113.7zM256 320c23.2.4 56.6-29.2 73.4-41.4 132.7-96.3 142.8-104.7 173.4-128.7 5.8-4.5 9.2-11.5 9.2-18.9v-19c0-26.5-21.5-48-48-48H48C21.5 64 0 85.5 0 112v19c0 7.4 3.4 14.3 9.2 18.9 30.6 23.9 40.7 32.4 173.4 128.7 16.8 12.2 50.2 41.8 73.4 41.4z"/></svg>email</a> or <a class="is-link" href="https://subscribe.sorryapp.com/24846f03/slack/new" target="_blank"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512" class="icon filter-black" role="presentation"><path d="M94.12 315.1c0 25.9-21.16 47.06-47.06 47.06S0 341 0 315.1c0-25.9 21.16-47.06 47.06-47.06h47.06v47.06zm23.72 0c0-25.9 21.16-47.06 47.06-47.06s47.06 21.16 47.06 47.06v117.84c0 25.9-21.16 47.06-47.06 47.06s-47.06-21.16-47.06-47.06V315.1zm47.06-188.98c-25.9 0-47.06-21.16-47.06-47.06S139 32 164.9 32s47.06 21.16 47.06 47.06v47.06H164.9zm0 23.72c25.9 0 47.06 21.16 47.06 47.06s-21.16 47.06-47.06 47.06H47.06C21.16 243.96 0 222.8 0 196.9s21.16-47.06 47.06-47.06H164.9zm188.98 47.06c0-25.9 21.16-47.06 47.06-47.06 25.9 0 47.06 21.16 47.06 47.06s-21.16 47.06-47.06 47.06h-47.06V196.9zm-23.72 0c0 25.9-21.16 47.06-47.06 47.06-25.9 0-47.06-21.16-47.06-47.06V79.06c0-25.9 21.16-47.06 47.06-47.06 25.9 0 47.06 21.16 47.06 47.06V196.9zM283.1 385.88c25.9 0 47.06 21.16 47.06 47.06 0 25.9-21.16 47.06-47.06 47.06-25.9 0-47.06-21.16-47.06-47.06v-47.06h47.06zm0-23.72c-25.9 0-47.06-21.16-47.06-47.06 0-25.9 21.16-47.06 
47.06-47.06h117.84c25.9 0 47.06 21.16 47.06 47.06 0 25.9-21.16 47.06-47.06 47.06H283.1z"/></svg>slack</a> </p> </li> </ul> </div> </div> </div>   </div> </footer> </div> <script src="/static/base/1.0.1/js/member_acknowledgement.js"></script> </body> </html>

CINXE.COM

Computer Vision and Pattern Recognition