CINXE.COM
Multimedia
<?xml version="1.0" encoding="UTF-8"?> <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> <html xmlns="http://www.w3.org/1999/xhtml" lang="en" xml:lang="en"> <head> <title>Multimedia </title> <meta name="viewport" content="width=device-width, initial-scale=1"> <link rel="apple-touch-icon" sizes="180x180" href="/static/browse/0.3.4/images/icons/apple-touch-icon.png"> <link rel="icon" type="image/png" sizes="32x32" href="/static/browse/0.3.4/images/icons/favicon-32x32.png"> <link rel="icon" type="image/png" sizes="16x16" href="/static/browse/0.3.4/images/icons/favicon-16x16.png"> <link rel="manifest" href="/static/browse/0.3.4/images/icons/site.webmanifest"> <link rel="mask-icon" href="/static/browse/0.3.4/images/icons/safari-pinned-tab.svg" color="#5bbad5"> <meta name="msapplication-TileColor" content="#da532c"> <meta name="theme-color" content="#ffffff"> <link rel="stylesheet" type="text/css" media="screen" href="/static/browse/0.3.4/css/arXiv.css?v=20240822" /> <link rel="stylesheet" type="text/css" media="print" href="/static/browse/0.3.4/css/arXiv-print.css?v=20200611" /> <link rel="stylesheet" type="text/css" media="screen" href="/static/browse/0.3.4/css/browse_search.css" /> <script language="javascript" src="/static/browse/0.3.4/js/accordion.js" /></script> <script src="/static/browse/0.3.4/js/mathjaxToggle.min.js" type="text/javascript"></script> <script type="text/javascript" language="javascript">mathjaxToggle();</script> </head> <body class="with-cu-identity"> <div class="flex-wrap-footer"> <header> <a href="#content" class="is-sr-only">Skip to main content</a> <!-- start desktop header --> <div class="columns is-vcentered is-hidden-mobile" id="cu-identity"> <div class="column" id="cu-logo"> <a href="https://www.cornell.edu/"><img src="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg" alt="Cornell University" /></a> </div><div class="column" id="support-ack"> <span 
id="support-ack-url">We gratefully acknowledge support from the Simons Foundation, <a href="https://info.arxiv.org/about/ourmembers.html">member institutions</a>, and all contributors.</span> <a href="https://info.arxiv.org/about/donate.html" class="btn-header-donate">Donate</a> </div> </div> <div id="header" class="is-hidden-mobile"> <a aria-hidden="true" tabindex="-1" href="/IgnoreMe"></a> <div class="header-breadcrumbs"> <a href="/"><img src="/static/browse/0.3.4/images/arxiv-logo-one-color-white.svg" alt="arxiv logo" style="height:40px;"/></a> <span>></span> <a href="/list/cs.MM/recent">cs.MM</a> </div> <div class="search-block level-right"> <form class="level-item mini-search" method="GET" action="https://arxiv.org/search"> <div class="field has-addons"> <div class="control"> <input class="input is-small" type="text" name="query" placeholder="Search..." aria-label="Search term or terms" /> <p class="help"><a href="https://info.arxiv.org/help">Help</a> | <a href="https://arxiv.org/search/advanced">Advanced Search</a></p> </div> <div class="control"> <div class="select is-small"> <select name="searchtype" aria-label="Field to search"> <option value="all" selected="selected">All fields</option> <option value="title">Title</option> <option value="author">Author</option> <option value="abstract">Abstract</option> <option value="comments">Comments</option> <option value="journal_ref">Journal reference</option> <option value="acm_class">ACM classification</option> <option value="msc_class">MSC classification</option> <option value="report_num">Report number</option> <option value="paper_id">arXiv identifier</option> <option value="doi">DOI</option> <option value="orcid">ORCID</option> <option value="author_id">arXiv author ID</option> <option value="help">Help pages</option> <option value="full_text">Full text</option> </select> </div> </div> <input type="hidden" name="source" value="header"> <button class="button is-small is-cul-darker">Search</button> </div> 
</form> </div> </div><!-- /end desktop header --> <div class="mobile-header"> <div class="columns is-mobile"> <div class="column logo-arxiv"><a href="https://arxiv.org/"><img src="/static/browse/0.3.4/images/arxiv-logomark-small-white.svg" alt="arXiv logo" style="height:60px;" /></a></div> <div class="column logo-cornell"><a href="https://www.cornell.edu/"> <picture> <source media="(min-width: 501px)" srcset="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg 400w" sizes="400w" /> <source srcset="/static/browse/0.3.4/images/icons/cu/cornell_seal_simple_black.svg 2x" /> <img src="/static/browse/0.3.4/images/icons/cu/cornell-reduced-white-SMALL.svg" alt="Cornell University Logo" /> </picture> </a></div> <div class="column nav" id="toggle-container" role="menubar"> <button class="toggle-control"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-white"><title>open search</title><path d="M505 442.7L405.3 343c-4.5-4.5-10.6-7-17-7H372c27.6-35.3 44-79.7 44-128C416 93.1 322.9 0 208 0S0 93.1 0 208s93.1 208 208 208c48.3 0 92.7-16.4 128-44v16.3c0 6.4 2.5 12.5 7 17l99.7 99.7c9.4 9.4 24.6 9.4 33.9 0l28.3-28.3c9.4-9.4 9.4-24.6.1-34zM208 336c-70.7 0-128-57.2-128-128 0-70.7 57.2-128 128-128 70.7 0 128 57.2 128 128 0 70.7-57.2 128-128 128z"/></svg></button> <div class="mobile-toggle-block toggle-target"> <form class="mobile-search-form" method="GET" action="https://arxiv.org/search"> <div class="field has-addons"> <input class="input" type="text" name="query" placeholder="Search..." 
aria-label="Search term or terms" /> <input type="hidden" name="source" value="header"> <input type="hidden" name="searchtype" value="all"> <button class="button">GO</button> </div> </form> </div> <button class="toggle-control"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512" class="icon filter-white" role="menu"><title>open navigation menu</title><path d="M16 132h416c8.837 0 16-7.163 16-16V76c0-8.837-7.163-16-16-16H16C7.163 60 0 67.163 0 76v40c0 8.837 7.163 16 16 16zm0 160h416c8.837 0 16-7.163 16-16v-40c0-8.837-7.163-16-16-16H16c-8.837 0-16 7.163-16 16v40c0 8.837 7.163 16 16 16zm0 160h416c8.837 0 16-7.163 16-16v-40c0-8.837-7.163-16-16-16H16c-8.837 0-16 7.163-16 16v40c0 8.837 7.163 16 16 16z"/ ></svg></button> <div class="mobile-toggle-block toggle-target"> <nav class="mobile-menu" aria-labelledby="mobilemenulabel"> <h2 id="mobilemenulabel">quick links</h2> <ul> <li><a href="https://arxiv.org/login">Login</a></li> <li><a href="https://info.arxiv.org/help">Help Pages</a></li> <li><a href="https://info.arxiv.org/about">About</a></li> </ul> </nav> </div> </div> </div> </div><!-- /end mobile-header --> </header> <main> <div id="content"> <div id='content-inner'> <div id='dlpage'> <h1>Multimedia</h1> <h2>Authors and titles for recent submissions</h2> <ul> <li> <a href="/list/cs.MM/recent?skip=0&show=50"> Fri, 22 Nov 2024 </a> </li><li> <a href="/list/cs.MM/recent?skip=6&show=50"> Thu, 21 Nov 2024 </a> </li><li> <a href="/list/cs.MM/recent?skip=10&show=50"> Wed, 20 Nov 2024 </a> </li><li> <a href="/list/cs.MM/recent?skip=14&show=50"> Tue, 19 Nov 2024 </a> </li><li> <a href="/list/cs.MM/recent?skip=20&show=50"> Mon, 18 Nov 2024 </a> </li></ul> <p>See today's <a id="new-cs.MM" aria-labelledby="new-cs.MM" href="/list/cs.MM/new">new</a> changes</p> <div class='paging'>Total of 26 entries </div> <div class='morefewer'>Showing up to 50 entries per page: <a href=/list/cs.MM/recent?skip=0&show=25 rel="nofollow"> fewer</a> | <span style="color: #454545">more</span> | 
<span style="color: #454545">all</span> </div> <dl id='articles'> <h3>Fri, 22 Nov 2024 (showing 6 of 6 entries )</h3> <dt> <a name='item1'>[1]</a> <a href ="/abs/2411.13917" title="Abstract" id="2411.13917"> arXiv:2411.13917 </a> [<a href="/pdf/2411.13917" title="Download PDF" id="pdf-2411.13917" aria-labelledby="pdf-2411.13917">pdf</a>, <a href="https://arxiv.org/html/2411.13917v1" title="View HTML" id="html-2411.13917" aria-labelledby="html-2411.13917" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.13917" title="Other formats" id="oth-2411.13917" aria-labelledby="oth-2411.13917">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> SpikEmo: Enhancing Emotion Recognition With Spiking Temporal Dynamics in Conversations </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Yu,+X">Xiaomin Yu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+F">Feiyang Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Qiao,+Z">Ziyue Qiao</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Multimedia (cs.MM)</span> </div> </div> </dd> <dt> <a name='item2'>[2]</a> <a href ="/abs/2411.14207" title="Abstract" id="2411.14207"> arXiv:2411.14207 </a> (cross-list from cs.SD) [<a href="/pdf/2411.14207" title="Download PDF" id="pdf-2411.14207" aria-labelledby="pdf-2411.14207">pdf</a>, <a href="https://arxiv.org/html/2411.14207v1" title="View HTML" id="html-2411.14207" aria-labelledby="html-2411.14207" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.14207" title="Other formats" id="oth-2411.14207" aria-labelledby="oth-2411.14207">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> HARP: A Large-Scale Higher-Order Ambisonic Room Impulse Response Dataset </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Saini,+S">Shivam Saini</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Peissig,+J">Jürgen Peissig</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Submitted to ICASSP 2025 Workshop Dataset and code to be uploaded at: <a href="https://github.com/whojavumusic/HARP" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Sound (cs.SD)</span>; Artificial Intelligence (cs.AI); Multimedia (cs.MM); Audio and Speech Processing (eess.AS) </div> </div> </dd> <dt> <a name='item3'>[3]</a> <a href ="/abs/2411.14135" title="Abstract" id="2411.14135"> arXiv:2411.14135 </a> (cross-list from eess.IV) [<a href="/pdf/2411.14135" title="Download PDF" id="pdf-2411.14135" aria-labelledby="pdf-2411.14135">pdf</a>, <a href="https://arxiv.org/html/2411.14135v1" title="View HTML" id="html-2411.14135" aria-labelledby="html-2411.14135" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.14135" title="Other formats" id="oth-2411.14135" aria-labelledby="oth-2411.14135">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Compact Visual Data Representation for Green Multimedia -- A Human Visual System Perspective </div> <div class='list-authors'><a href="https://arxiv.org/search/eess?searchtype=author&query=Chen,+P">Peilin Chen</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Fang,+X">Xiaohan Fang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Wang,+M">Meng Wang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Wang,+S">Shiqi Wang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Ma,+S">Siwei Ma</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span 
class="primary-subject">Image and Video Processing (eess.IV)</span>; Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item4'>[4]</a> <a href ="/abs/2411.13819" title="Abstract" id="2411.13819"> arXiv:2411.13819 </a> (cross-list from cs.CR) [<a href="/pdf/2411.13819" title="Download PDF" id="pdf-2411.13819" aria-labelledby="pdf-2411.13819">pdf</a>, <a href="https://arxiv.org/html/2411.13819v1" title="View HTML" id="html-2411.13819" aria-labelledby="html-2411.13819" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.13819" title="Other formats" id="oth-2411.13819" aria-labelledby="oth-2411.13819">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Robust Steganography with Boundary-Preserving Overflow Alleviation and Adaptive Error Correction </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Cheng,+Y">Yu Cheng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Luo,+Z">Zhenlin Luo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yin,+Z">Zhaoxia Yin</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Cryptography and Security (cs.CR)</span>; Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item5'>[5]</a> <a href ="/abs/2411.13811" title="Abstract" id="2411.13811"> arXiv:2411.13811 </a> (cross-list from cs.SD) [<a href="/pdf/2411.13811" title="Download PDF" id="pdf-2411.13811" aria-labelledby="pdf-2411.13811">pdf</a>, <a href="https://arxiv.org/html/2411.13811v1" title="View HTML" id="html-2411.13811" aria-labelledby="html-2411.13811" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.13811" title="Other formats" id="oth-2411.13811" aria-labelledby="oth-2411.13811">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> X-CrossNet: A complex spectral mapping approach to 
target speaker extraction with cross attention speaker embedding fusion </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Sun,+C">Chang Sun</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Qin,+B">Bo Qin</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Sound (cs.SD)</span>; Multimedia (cs.MM); Audio and Speech Processing (eess.AS) </div> </div> </dd> <dt> <a name='item6'>[6]</a> <a href ="/abs/2411.13577" title="Abstract" id="2411.13577"> arXiv:2411.13577 </a> (cross-list from eess.AS) [<a href="/pdf/2411.13577" title="Download PDF" id="pdf-2411.13577" aria-labelledby="pdf-2411.13577">pdf</a>, <a href="https://arxiv.org/html/2411.13577v1" title="View HTML" id="html-2411.13577" aria-labelledby="html-2411.13577" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.13577" title="Other formats" id="oth-2411.13577" aria-labelledby="oth-2411.13577">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> WavChat: A Survey of Spoken Dialogue Models </div> <div class='list-authors'><a href="https://arxiv.org/search/eess?searchtype=author&query=Ji,+S">Shengpeng Ji</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Chen,+Y">Yifu Chen</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Fang,+M">Minghui Fang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Zuo,+J">Jialong Zuo</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Lu,+J">Jingyu Lu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Wang,+H">Hanting Wang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Jiang,+Z">Ziyue Jiang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Zhou,+L">Long Zhou</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Liu,+S">Shujie Liu</a>, <a 
href="https://arxiv.org/search/eess?searchtype=author&query=Cheng,+X">Xize Cheng</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Yang,+X">Xiaoda Yang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Wang,+Z">Zehan Wang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Yang,+Q">Qian Yang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Li,+J">Jian Li</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Jiang,+Y">Yidi Jiang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=He,+J">Jingzhen He</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Chu,+Y">Yunfei Chu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Xu,+J">Jin Xu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Zhao,+Z">Zhou Zhao</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 60 papes, working in progress </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Audio and Speech Processing (eess.AS)</span>; Computation and Language (cs.CL); Machine Learning (cs.LG); Multimedia (cs.MM); Sound (cs.SD) </div> </div> </dd> </dl> <dl id='articles'> <h3>Thu, 21 Nov 2024 (showing 4 of 4 entries )</h3> <dt> <a name='item7'>[7]</a> <a href ="/abs/2411.12907" title="Abstract" id="2411.12907"> arXiv:2411.12907 </a> [<a href="/pdf/2411.12907" title="Download PDF" id="pdf-2411.12907" aria-labelledby="pdf-2411.12907">pdf</a>, <a href="https://arxiv.org/html/2411.12907v1" title="View HTML" id="html-2411.12907" aria-labelledby="html-2411.12907" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12907" title="Other formats" id="oth-2411.12907" aria-labelledby="oth-2411.12907">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Narrative Information Theory </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Schulz,+L">Lion Schulz</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Patr%C3%ADcio,+M">Miguel Patrício</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Odijk,+D">Daan Odijk</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> To be published in NeurIPS 2024 Workshop on Creativity & Generative AI. 7 pages, 3 figures </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Multimedia (cs.MM)</span>; Information Theory (cs.IT) </div> </div> </dd> <dt> <a name='item8'>[8]</a> <a href ="/abs/2411.12825" title="Abstract" id="2411.12825"> arXiv:2411.12825 </a> [<a href="/pdf/2411.12825" title="Download PDF" id="pdf-2411.12825" aria-labelledby="pdf-2411.12825">pdf</a>, <a href="https://arxiv.org/html/2411.12825v1" title="View HTML" id="html-2411.12825" aria-labelledby="html-2411.12825" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12825" title="Other formats" id="oth-2411.12825" aria-labelledby="oth-2411.12825">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> TopoCode: Topologically Informed Error Detection and Correction in Communication Systems </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+H">Hongzhi Guo</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Multimedia (cs.MM)</span> </div> </div> </dd> <dt> <a name='item9'>[9]</a> <a href ="/abs/2411.13536" title="Abstract" id="2411.13536"> arXiv:2411.13536 </a> (cross-list from cs.CV) [<a href="/pdf/2411.13536" title="Download PDF" id="pdf-2411.13536" aria-labelledby="pdf-2411.13536">pdf</a>, <a href="https://arxiv.org/html/2411.13536v1" title="View HTML" id="html-2411.13536" aria-labelledby="html-2411.13536" rel="noopener noreferrer" 
target="_blank">html</a>, <a href="/format/2411.13536" title="Other formats" id="oth-2411.13536" aria-labelledby="oth-2411.13536">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Identity Preserving 3D Head Stylization with Multiview Score Distillation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Bilecen,+B+B">Bahri Batuhan Bilecen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gokmen,+A+B">Ahmet Berke Gokmen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Guzelant,+F">Furkan Guzelant</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Dundar,+A">Aysegul Dundar</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> <a href="https://three-bee.github.io/head_stylization" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Graphics (cs.GR); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item10'>[10]</a> <a href ="/abs/2411.13281" title="Abstract" id="2411.13281"> arXiv:2411.13281 </a> (cross-list from cs.CV) [<a href="/pdf/2411.13281" title="Download PDF" id="pdf-2411.13281" aria-labelledby="pdf-2411.13281">pdf</a>, <a href="https://arxiv.org/html/2411.13281v1" title="View HTML" id="html-2411.13281" aria-labelledby="html-2411.13281" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.13281" title="Other formats" id="oth-2411.13281" aria-labelledby="oth-2411.13281">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> VideoAutoArena: An Automated Arena for Evaluating Large Multimodal Models in Video Analysis through User Simulation </div> <div 
class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Luo,+Z">Ziyang Luo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+H">Haoning Wu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+D">Dongxu Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ma,+J">Jing Ma</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kankanhalli,+M">Mohan Kankanhalli</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+J">Junnan Li</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project Page: <a href="https://videoautoarena.github.io/" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Computation and Language (cs.CL); Multimedia (cs.MM) </div> </div> </dd> </dl> <dl id='articles'> <h3>Wed, 20 Nov 2024 (showing 4 of 4 entries )</h3> <dt> <a name='item11'>[11]</a> <a href ="/abs/2411.12293" title="Abstract" id="2411.12293"> arXiv:2411.12293 </a> (cross-list from cs.CV) [<a href="/pdf/2411.12293" title="Download PDF" id="pdf-2411.12293" aria-labelledby="pdf-2411.12293">pdf</a>, <a href="https://arxiv.org/html/2411.12293v1" title="View HTML" id="html-2411.12293" aria-labelledby="html-2411.12293" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12293" title="Other formats" id="oth-2411.12293" aria-labelledby="oth-2411.12293">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Generative Timelines for Instructed Visual Assembly </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Pardo,+A">Alejandro Pardo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+J">Jui-Hsien 
Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ghanem,+B">Bernard Ghanem</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sivic,+J">Josef Sivic</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Russell,+B">Bryan Russell</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Heilbron,+F+C">Fabian Caba Heilbron</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Human-Computer Interaction (cs.HC); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item12'>[12]</a> <a href ="/abs/2411.12197" title="Abstract" id="2411.12197"> arXiv:2411.12197 </a> (cross-list from cs.CV) [<a href="/pdf/2411.12197" title="Download PDF" id="pdf-2411.12197" aria-labelledby="pdf-2411.12197">pdf</a>, <a href="https://arxiv.org/html/2411.12197v1" title="View HTML" id="html-2411.12197" aria-labelledby="html-2411.12197" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12197" title="Other formats" id="oth-2411.12197" aria-labelledby="oth-2411.12197">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> MTFusion: Reconstructing Any 3D Object from Single Image Using Multi-word Textual Inversion </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Liu,+Y">Yu Liu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+R">Ruowei Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+J">Jiaqi Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xu,+Z">Zixiang Xu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhao,+Q">Qijun Zhao</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> PRCV 2024 </div> <div class='list-journal-ref'><span class='descriptor'>Journal-ref:</span> Pattern Recognition and 
Computer Vision (2025), Springer Nature Singapore, pages 166-180, ISBN 978-981-97-8508-7 </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item13'>[13]</a> <a href ="/abs/2411.12072" title="Abstract" id="2411.12072"> arXiv:2411.12072 </a> (cross-list from cs.CV) [<a href="/pdf/2411.12072" title="Download PDF" id="pdf-2411.12072" aria-labelledby="pdf-2411.12072">pdf</a>, <a href="https://arxiv.org/html/2411.12072v1" title="View HTML" id="html-2411.12072" aria-labelledby="html-2411.12072" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12072" title="Other formats" id="oth-2411.12072" aria-labelledby="oth-2411.12072">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Zoomed In, Diffused Out: Towards Local Degradation-Aware Multi-Diffusion for Extreme Image Super-Resolution </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Moser,+B+B">Brian B. Moser</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Frolov,+S">Stanislav Frolov</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nauen,+T+C">Tobias C. 
Nauen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Raue,+F">Federico Raue</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Dengel,+A">Andreas Dengel</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item14'>[14]</a> <a href ="/abs/2411.12008" title="Abstract" id="2411.12008"> arXiv:2411.12008 </a> (cross-list from cs.SD) [<a href="/pdf/2411.12008" title="Download PDF" id="pdf-2411.12008" aria-labelledby="pdf-2411.12008">pdf</a>, <a href="https://arxiv.org/html/2411.12008v1" title="View HTML" id="html-2411.12008" aria-labelledby="html-2411.12008" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.12008" title="Other formats" id="oth-2411.12008" aria-labelledby="oth-2411.12008">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Compression of Higher Order Ambisonics with Multichannel RVQGAN </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Hirvonen,+T">Toni Hirvonen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Namazi,+M">Mahmoud Namazi</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Sound (cs.SD)</span>; Machine Learning (cs.LG); Multimedia (cs.MM); Audio and Speech Processing (eess.AS) </div> </div> </dd> </dl> <dl id='articles'> <h3>Tue, 19 Nov 2024 (showing 6 of 6 entries )</h3> <dt> <a name='item15'>[15]</a> <a href ="/abs/2411.11688" title="Abstract" id="2411.11688"> arXiv:2411.11688 </a> (cross-list from cs.CR) [<a href="/pdf/2411.11688" title="Download PDF" id="pdf-2411.11688" aria-labelledby="pdf-2411.11688">pdf</a>, <a href="https://arxiv.org/html/2411.11688v1" title="View HTML" 
id="html-2411.11688" aria-labelledby="html-2411.11688" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.11688" title="Other formats" id="oth-2411.11688" aria-labelledby="oth-2411.11688">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Conceptwm: A Diffusion Model Watermark for Concept Protection </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Lei,+L">Liangqi Lei</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Gai,+K">Keke Gai</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yu,+J">Jing Yu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhu,+L">Liehuang Zhu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wu,+Q">Qi Wu</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Cryptography and Security (cs.CR)</span>; Artificial Intelligence (cs.AI); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item16'>[16]</a> <a href ="/abs/2411.11278" title="Abstract" id="2411.11278"> arXiv:2411.11278 </a> (cross-list from cs.CV) [<a href="/pdf/2411.11278" title="Download PDF" id="pdf-2411.11278" aria-labelledby="pdf-2411.11278">pdf</a>, <a href="https://arxiv.org/html/2411.11278v1" title="View HTML" id="html-2411.11278" aria-labelledby="html-2411.11278" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.11278" title="Other formats" id="oth-2411.11278" aria-labelledby="oth-2411.11278">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Towards Open-Vocabulary Audio-Visual Event Localization </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Zhou,+J">Jinxing Zhou</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+D">Dan Guo</a>, <a 
href="https://arxiv.org/search/cs?searchtype=author&query=Guo,+R">Ruohao Guo</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Mao,+Y">Yuxin Mao</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Hu,+J">Jingjing Hu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhong,+Y">Yiran Zhong</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chang,+X">Xiaojun Chang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+M">Meng Wang</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Project page: <a href="https://github.com/jasongief/OV-AVEL" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item17'>[17]</a> <a href ="/abs/2411.11222" title="Abstract" id="2411.11222"> arXiv:2411.11222 </a> (cross-list from cs.CV) [<a href="/pdf/2411.11222" title="Download PDF" id="pdf-2411.11222" aria-labelledby="pdf-2411.11222">pdf</a>, <a href="/format/2411.11222" title="Other formats" id="oth-2411.11222" aria-labelledby="oth-2411.11222">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> The Sound of Water: Inferring Physical Properties from Pouring Liquids </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Bagad,+P">Piyush Bagad</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Tapaswi,+M">Makarand Tapaswi</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Snoek,+C+G+M">Cees G. M. Snoek</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zisserman,+A">Andrew Zisserman</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 25 pages, 17 figures. 
Project page at <a href="https://bpiyush.github.io/pouring-water-website" rel="external noopener nofollow" class="link-external link-https">this https URL</a> </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Multimedia (cs.MM); Sound (cs.SD); Audio and Speech Processing (eess.AS) </div> </div> </dd> <dt> <a name='item18'>[18]</a> <a href ="/abs/2411.10775" title="Abstract" id="2411.10775"> arXiv:2411.10775 </a> (cross-list from eess.IV) [<a href="/pdf/2411.10775" title="Download PDF" id="pdf-2411.10775" aria-labelledby="pdf-2411.10775">pdf</a>, <a href="https://arxiv.org/html/2411.10775v1" title="View HTML" id="html-2411.10775" aria-labelledby="html-2411.10775" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10775" title="Other formats" id="oth-2411.10775" aria-labelledby="oth-2411.10775">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Beyond Feature Mapping GAP: Integrating Real HDRTV Priors for Superior SDRTV-to-HDRTV Conversion </div> <div class='list-authors'><a href="https://arxiv.org/search/eess?searchtype=author&query=Xu,+K">Kepeng Xu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Xu,+L">Li Xu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=He,+G">Gang He</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Zhang,+Z">Zhiqiang Zhang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Yu,+W">Wenxin Yu</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Wang,+S">Shihao Wang</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Zhou,+D">Dajiang Zhou</a>, <a href="https://arxiv.org/search/eess?searchtype=author&query=Li,+Y">Yunsong Li</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> 8 pages,4 figures </div> <div 
class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Image and Video Processing (eess.IV)</span>; Computer Vision and Pattern Recognition (cs.CV); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item19'>[19]</a> <a href ="/abs/2411.10513" title="Abstract" id="2411.10513"> arXiv:2411.10513 </a> (cross-list from cs.CV) [<a href="/pdf/2411.10513" title="Download PDF" id="pdf-2411.10513" aria-labelledby="pdf-2411.10513">pdf</a>, <a href="https://arxiv.org/html/2411.10513v1" title="View HTML" id="html-2411.10513" aria-labelledby="html-2411.10513" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10513" title="Other formats" id="oth-2411.10513" aria-labelledby="oth-2411.10513">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Any2Any: Incomplete Multimodal Retrieval with Conformal Prediction </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+P">Po-han Li</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+Y">Yunhao Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Omama,+M">Mohammad Omama</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chinchali,+S">Sandeep Chinchali</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Topcu,+U">Ufuk Topcu</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Information Retrieval (cs.IR); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item20'>[20]</a> <a href ="/abs/2411.10480" title="Abstract" id="2411.10480"> arXiv:2411.10480 </a> (cross-list from cs.CV) [<a href="/pdf/2411.10480" title="Download PDF" id="pdf-2411.10480" aria-labelledby="pdf-2411.10480">pdf</a>, <a href="https://arxiv.org/html/2411.10480v1" title="View HTML" id="html-2411.10480" 
aria-labelledby="html-2411.10480" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10480" title="Other formats" id="oth-2411.10480" aria-labelledby="oth-2411.10480">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Hateful Meme Detection through Context-Sensitive Prompting and Fine-Grained Labeling </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Ouyang,+R">Rongxin Ouyang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Jaidka,+K">Kokil Jaidka</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Mukerjee,+S">Subhayan Mukerjee</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Cui,+G">Guangyu Cui</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> AAAI-25 Student Abstract, Oral Presentation </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Computation and Language (cs.CL); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> </dl> <dl id='articles'> <h3>Mon, 18 Nov 2024 (showing 6 of 6 entries )</h3> <dt> <a name='item21'>[21]</a> <a href ="/abs/2411.10060" title="Abstract" id="2411.10060"> arXiv:2411.10060 </a> [<a href="/pdf/2411.10060" title="Download PDF" id="pdf-2411.10060" aria-labelledby="pdf-2411.10060">pdf</a>, <a href="https://arxiv.org/html/2411.10060v1" title="View HTML" id="html-2411.10060" aria-labelledby="html-2411.10060" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10060" title="Other formats" id="oth-2411.10060" aria-labelledby="oth-2411.10060">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> CMATH: Cross-Modality Augmented Transformer with Hierarchical Variational Distillation for Multimodal 
Emotion Recognition in Conversation </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Zhu,+X">Xiaofei Zhu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Cheng,+J">Jiawei Cheng</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yang,+Z">Zhou Yang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+Z">Zhuo Chen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Wang,+Q">Qingyang Wang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yao,+J">Jianfeng Yao</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Multimedia (cs.MM)</span>; Computation and Language (cs.CL) </div> </div> </dd> <dt> <a name='item22'>[22]</a> <a href ="/abs/2411.10436" title="Abstract" id="2411.10436"> arXiv:2411.10436 </a> (cross-list from cs.CL) [<a href="/pdf/2411.10436" title="Download PDF" id="pdf-2411.10436" aria-labelledby="pdf-2411.10436">pdf</a>, <a href="https://arxiv.org/html/2411.10436v1" title="View HTML" id="html-2411.10436" aria-labelledby="html-2411.10436" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10436" title="Other formats" id="oth-2411.10436" aria-labelledby="oth-2411.10436">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Mitigating Hallucination in Multimodal Large Language Model via Hallucination-targeted Direct Preference Optimization </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Fu,+Y">Yuhan Fu</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xie,+R">Ruobing Xie</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sun,+X">Xingwu Sun</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Kang,+Z">Zhanhui Kang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Li,+X">Xirong Li</a></div> <div 
class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computation and Language (cs.CL)</span>; Artificial Intelligence (cs.AI); Computer Vision and Pattern Recognition (cs.CV); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item23'>[23]</a> <a href ="/abs/2411.10231" title="Abstract" id="2411.10231"> arXiv:2411.10231 </a> (cross-list from cs.CV) [<a href="/pdf/2411.10231" title="Download PDF" id="pdf-2411.10231" aria-labelledby="pdf-2411.10231">pdf</a>, <a href="https://arxiv.org/html/2411.10231v1" title="View HTML" id="html-2411.10231" aria-labelledby="html-2411.10231" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10231" title="Other formats" id="oth-2411.10231" aria-labelledby="oth-2411.10231">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> A Low-Resolution Image is Worth 1x1 Words: Enabling Fine Image Super-Resolution with Transformers and TaylorShift </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Nagaraju,+S+B">Sanath Budakegowdanadoddi Nagaraju</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Moser,+B+B">Brian Bernhard Moser</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nauen,+T+C">Tobias Christian Nauen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Frolov,+S">Stanislav Frolov</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Raue,+F">Federico Raue</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Dengel,+A">Andreas Dengel</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item24'>[24]</a> <a href ="/abs/2411.10034" title="Abstract" id="2411.10034"> arXiv:2411.10034 
</a> (cross-list from cs.CR) [<a href="/pdf/2411.10034" title="Download PDF" id="pdf-2411.10034" aria-labelledby="pdf-2411.10034">pdf</a>, <a href="https://arxiv.org/html/2411.10034v1" title="View HTML" id="html-2411.10034" aria-labelledby="html-2411.10034" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.10034" title="Other formats" id="oth-2411.10034" aria-labelledby="oth-2411.10034">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> EveGuard: Defeating Vibration-based Side-Channel Eavesdropping with Audio Adversarial Perturbations </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Chang,+J">Jung-Woo Chang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Sun,+K">Ke Sun</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Xia,+D">David Xia</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Zhang,+X">Xinyu Zhang</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Koushanfar,+F">Farinaz Koushanfar</a></div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Cryptography and Security (cs.CR)</span>; Multimedia (cs.MM); Sound (cs.SD); Audio and Speech Processing (eess.AS) </div> </div> </dd> <dt> <a name='item25'>[25]</a> <a href ="/abs/2411.09955" title="Abstract" id="2411.09955"> arXiv:2411.09955 </a> (cross-list from cs.CV) [<a href="/pdf/2411.09955" title="Download PDF" id="pdf-2411.09955" aria-labelledby="pdf-2411.09955">pdf</a>, <a href="https://arxiv.org/html/2411.09955v2" title="View HTML" id="html-2411.09955" aria-labelledby="html-2411.09955" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.09955" title="Other formats" id="oth-2411.09955" aria-labelledby="oth-2411.09955">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> Instruction-Guided 
Editing Controls for Images and Multimedia: A Survey in LLM era </div> <div class='list-authors'><a href="https://arxiv.org/search/cs?searchtype=author&query=Nguyen,+T+T">Thanh Tam Nguyen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Ren,+Z">Zhao Ren</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Pham,+T">Trinh Pham</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Huynh,+T+T">Thanh Trung Huynh</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nguyen,+P+L">Phi Le Nguyen</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Yin,+H">Hongzhi Yin</a>, <a href="https://arxiv.org/search/cs?searchtype=author&query=Nguyen,+Q+V+H">Quoc Viet Hung Nguyen</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> Fixed a serious error in author information </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Human-Computer Interaction (cs.HC); Machine Learning (cs.LG); Multimedia (cs.MM) </div> </div> </dd> <dt> <a name='item26'>[26]</a> <a href ="/abs/2411.09952" title="Abstract" id="2411.09952"> arXiv:2411.09952 </a> (cross-list from cs.CV) [<a href="/pdf/2411.09952" title="Download PDF" id="pdf-2411.09952" aria-labelledby="pdf-2411.09952">pdf</a>, <a href="https://arxiv.org/html/2411.09952v1" title="View HTML" id="html-2411.09952" aria-labelledby="html-2411.09952" rel="noopener noreferrer" target="_blank">html</a>, <a href="/format/2411.09952" title="Other formats" id="oth-2411.09952" aria-labelledby="oth-2411.09952">other</a>] </dt> <dd> <div class='meta'> <div class='list-title mathjax'><span class='descriptor'>Title:</span> GGAvatar: Reconstructing Garment-Separated 3D Gaussian Splatting Avatars from Monocular Video </div> <div class='list-authors'><a 
href="https://arxiv.org/search/cs?searchtype=author&query=Chen,+J">Jingxuan Chen</a></div> <div class='list-comments mathjax'><span class='descriptor'>Comments:</span> MMAsia'24 Accepted </div> <div class='list-subjects'><span class='descriptor'>Subjects:</span> <span class="primary-subject">Computer Vision and Pattern Recognition (cs.CV)</span>; Artificial Intelligence (cs.AI); Multimedia (cs.MM) </div> </div> </dd> </dl> <div class='paging'>Total of 26 entries </div> <!-- Page-size links: the href value is quoted because it contains "=", and its ampersand is escaped --> <div class='morefewer'>Showing up to 50 entries per page: <a href="/list/cs.MM/recent?skip=0&amp;show=25" rel="nofollow"> fewer</a> | <span style="color: #454545">more</span> | <span style="color: #454545">all</span> </div> </div> </div> </div> </main> <footer style="clear: both;"> <div class="columns is-desktop" role="navigation" aria-label="Secondary" style="margin: -0.75em -0.75em 0.75em -0.75em"> <!-- Macro-Column 1 --> <div class="column" style="padding: 0;"> <div class="columns"> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/about">About</a></li> <li><a href="https://info.arxiv.org/help">Help</a></li> </ul> </div> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li> <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-black" role="presentation"><title>contact arXiv</title><desc>Click here to contact arXiv</desc><path d="M502.3 190.8c3.9-3.1 9.7-.2 9.7 4.7V400c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48V195.6c0-5 5.7-7.8 9.7-4.7 22.4 17.4 52.1 39.5 154.1 113.6 21.1 15.4 56.7 47.8 92.2 47.6 35.7.3 72-32.8 92.3-47.6 102-74.1 131.6-96.3 154-113.7zM256 320c23.2.4 56.6-29.2 73.4-41.4 132.7-96.3 142.8-104.7 173.4-128.7 5.8-4.5 9.2-11.5 9.2-18.9v-19c0-26.5-21.5-48-48-48H48C21.5 64 0 85.5 0 112v19c0 7.4 3.4 14.3 9.2 18.9 30.6 23.9 40.7 32.4 173.4 128.7 16.8 12.2 50.2 41.8 73.4 41.4z"/></svg> <a href="https://info.arxiv.org/help/contact.html"> Contact</a> </li> <li> <svg 
xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-black" role="presentation"><title>subscribe to arXiv mailings</title><desc>Click here to subscribe</desc><path d="M476 3.2L12.5 270.6c-18.1 10.4-15.8 35.6 2.2 43.2L121 358.4l287.3-253.2c5.5-4.9 13.3 2.6 8.6 8.3L176 407v80.5c0 23.6 28.5 32.9 42.5 15.8L282 426l124.6 52.2c14.2 6 30.4-2.9 33-18.2l72-432C515 7.8 493.3-6.8 476 3.2z"/></svg> <a href="https://info.arxiv.org/help/subscribe"> Subscribe</a> </li> </ul> </div> </div> </div> <!-- End Macro-Column 1 --> <!-- Macro-Column 2 --> <div class="column" style="padding: 0;"> <div class="columns"> <div class="column"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/help/license/index.html">Copyright</a></li> <li><a href="https://info.arxiv.org/help/policies/privacy_policy.html">Privacy Policy</a></li> </ul> </div> <div class="column sorry-app-links"> <ul style="list-style: none; line-height: 2;"> <li><a href="https://info.arxiv.org/help/web_accessibility.html">Web Accessibility Assistance</a></li> <li> <!-- Links below open a new tab; rel="noopener noreferrer" keeps the opened page from reaching window.opener --> <p class="help"> <a class="a11y-main-link" href="https://status.arxiv.org" target="_blank" rel="noopener noreferrer">arXiv Operational Status <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 256 512" class="icon filter-dark_grey" role="presentation"><path d="M224.3 273l-136 136c-9.4 9.4-24.6 9.4-33.9 0l-22.6-22.6c-9.4-9.4-9.4-24.6 0-33.9l96.4-96.4-96.4-96.4c-9.4-9.4-9.4-24.6 0-33.9L54.3 103c9.4-9.4 24.6-9.4 33.9 0l136 136c9.5 9.4 9.5 24.6.1 34z"/></svg></a><br> Get status notifications via <a class="is-link" href="https://subscribe.sorryapp.com/24846f03/email/new" target="_blank" rel="noopener noreferrer"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512" class="icon filter-black" role="presentation"><path d="M502.3 190.8c3.9-3.1 9.7-.2 9.7 4.7V400c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48V195.6c0-5 5.7-7.8 9.7-4.7 22.4 17.4 52.1 39.5 154.1 113.6 21.1 15.4 56.7 47.8 92.2 47.6 35.7.3 72-32.8 92.3-47.6 102-74.1 131.6-96.3 154-113.7zM256 320c23.2.4 
56.6-29.2 73.4-41.4 132.7-96.3 142.8-104.7 173.4-128.7 5.8-4.5 9.2-11.5 9.2-18.9v-19c0-26.5-21.5-48-48-48H48C21.5 64 0 85.5 0 112v19c0 7.4 3.4 14.3 9.2 18.9 30.6 23.9 40.7 32.4 173.4 128.7 16.8 12.2 50.2 41.8 73.4 41.4z"/></svg>email</a> or <!-- opens a new tab; rel="noopener noreferrer" keeps the opened page from reaching window.opener --> <a class="is-link" href="https://subscribe.sorryapp.com/24846f03/slack/new" target="_blank" rel="noopener noreferrer"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 448 512" class="icon filter-black" role="presentation"><path d="M94.12 315.1c0 25.9-21.16 47.06-47.06 47.06S0 341 0 315.1c0-25.9 21.16-47.06 47.06-47.06h47.06v47.06zm23.72 0c0-25.9 21.16-47.06 47.06-47.06s47.06 21.16 47.06 47.06v117.84c0 25.9-21.16 47.06-47.06 47.06s-47.06-21.16-47.06-47.06V315.1zm47.06-188.98c-25.9 0-47.06-21.16-47.06-47.06S139 32 164.9 32s47.06 21.16 47.06 47.06v47.06H164.9zm0 23.72c25.9 0 47.06 21.16 47.06 47.06s-21.16 47.06-47.06 47.06H47.06C21.16 243.96 0 222.8 0 196.9s21.16-47.06 47.06-47.06H164.9zm188.98 47.06c0-25.9 21.16-47.06 47.06-47.06 25.9 0 47.06 21.16 47.06 47.06s-21.16 47.06-47.06 47.06h-47.06V196.9zm-23.72 0c0 25.9-21.16 47.06-47.06 47.06-25.9 0-47.06-21.16-47.06-47.06V79.06c0-25.9 21.16-47.06 47.06-47.06 25.9 0 47.06 21.16 47.06 47.06V196.9zM283.1 385.88c25.9 0 47.06 21.16 47.06 47.06 0 25.9-21.16 47.06-47.06 47.06-25.9 0-47.06-21.16-47.06-47.06v-47.06h47.06zm0-23.72c-25.9 0-47.06-21.16-47.06-47.06 0-25.9 21.16-47.06 47.06-47.06h117.84c25.9 0 47.06 21.16 47.06 47.06 0 25.9-21.16 47.06-47.06 47.06H283.1z"/></svg>slack</a> </p> </li> </ul> </div> </div> </div> <!-- end MetaColumn 2 --> <!-- End Macro-Column 2 --> </div> </footer> </div> <script src="/static/base/1.0.1/js/member_acknowledgement.js"></script> </body> </html>