CINXE.COM

Video Generation | Papers With Code

<!doctype html> <html lang="en"> <head> <meta charset="utf-8"> <meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no"> <script> const GTAG_ENABLED = true ; const GTAG_TRACKING_ID = "UA-121182717-1"; const SENTRY_DSN_FRONTEND = "".trim(); const GLOBAL_CSRF_TOKEN = 'Cq1cGLauLKtR3YGHHaLI2DQ6UtlZsdclF2EfE4ZldFDG0nFHB77zMMABqECLSEDb'; const MEDIA_URL = "https://production-media.paperswithcode.com/"; const ASSETS_URL = "https://production-assets.paperswithcode.com"; run_after_frontend_loaded = window.run_after_frontend_loaded || []; </script> <link rel="preconnect" href="https://production-assets.paperswithcode.com"><link rel="dns-prefetch" href="https://production-assets.paperswithcode.com"><link rel="preload" as="font" type="font/woff2" href="https://production-assets.paperswithcode.com/perf/fonts/65e877e527022735c1a1.woff2" crossorigin><link rel="preload" as="font" type="font/woff2" href="https://production-assets.paperswithcode.com/perf/fonts/917632e36982ca7933c8.woff2" crossorigin><link rel="preload" as="font" type="font/woff2" href="https://production-assets.paperswithcode.com/perf/fonts/f1405bd8a987c2ea8a67.woff2" crossorigin><script>(()=>{if(GTAG_ENABLED){const t=document.createElement("script");function n(){window.dataLayer.push(arguments)}t.src=`https://www.googletagmanager.com/gtag/js?id=${GTAG_TRACKING_ID}`,document.head.appendChild(t),window.dataLayer=window.dataLayer||[],window.gtag=n,n("js",new Date),n("config",GTAG_TRACKING_ID),window.captureOutboundLink=function(t){n("event","click",{event_category:"outbound",event_label:t})}}else window.captureOutboundLink=function(n){document.location=n}})();</script><link rel="preload" as="script" href="https://production-assets.paperswithcode.com/perf/766.4af6b88b.js"><link rel="preload" as="script" href="https://production-assets.paperswithcode.com/perf/2.6da00df7.js"><link rel="preload" as="script" href="https://production-assets.paperswithcode.com/perf/351.a22a9607.js"><link rel="preload" as="script" href="https://production-assets.paperswithcode.com/perf/101.5f271f23.js"><link rel="preload" as="style" href="https://production-assets.paperswithcode.com/perf/918.c41196c3.css"><link rel="preload" as="style" href="https://production-assets.paperswithcode.com/perf/view_task.8e3945a3.css"><link rel="preload" as="script" href="https://production-assets.paperswithcode.com/perf/view_task.e61ab167.js"><link rel="stylesheet" href="https://production-assets.paperswithcode.com/perf/918.c41196c3.css"><link rel="stylesheet" href="https://production-assets.paperswithcode.com/perf/view_task.8e3945a3.css"> <!-- Metadata --> <title>Video Generation | Papers With Code</title> <meta name="description" content="&lt;span style=&quot;color:grey; opacity: 0.6&quot;&gt;( Various Video Generation Tasks. Gif credit: [MaGViT](https://paperswithcode.com/paper/magvit-masked-generative-video-transformer) )&lt;/span&gt;" /> <!-- Open Graph protocol metadata --> <meta property="og:title" content="Papers with Code - Video Generation"> <meta property="og:description" content="&lt;span style=&quot;color:grey; opacity: 0.6&quot;&gt;( Various Video Generation Tasks. Gif credit: [MaGViT](https://paperswithcode.com/paper/magvit-masked-generative-video-transformer) )&lt;/span&gt;"> <meta property="og:image" content="https://production-media.paperswithcode.com/tasks/fae9be37-f327-44c5-b788-312c64aefef6.gif"> <meta property="og:url" content="https://paperswithcode.com/task/video-generation"> <!-- Twitter metadata --> <meta name="twitter:card" content="summary_large_image"> <meta name="twitter:site" content="@paperswithcode"> <meta name="twitter:title" content="Papers with Code - Video Generation"> <meta name="twitter:description" content="&lt;span style=&quot;color:grey; opacity: 0.6&quot;&gt;( Various Video Generation Tasks. Gif credit: [MaGViT](https://paperswithcode.com/paper/magvit-masked-generative-video-transformer) )&lt;/span&gt;"> <meta name="twitter:creator" content="@paperswithcode"> <meta name="twitter:url" content="https://paperswithcode.com/task/video-generation"> <meta name="twitter:domain" content="paperswithcode.com"> <!-- JSON LD --> <script type="application/ld+json">{ "@context": "http://schema.org", "@graph": { "@type": "CreativeWork", "@id": "video-generation", "name": "Video Generation", "description": "\u003Cspan style=\"color:grey; opacity: 0.6\"\u003E( Various Video Generation Tasks.\r\nGif credit: [MaGViT](https://paperswithcode.com/paper/magvit-masked-generative-video-transformer) )\u003C/span\u003E", "url": "https://paperswithcode.com/task/video-generation", "image": "https://production-media.paperswithcode.com/tasks/fae9be37-f327-44c5-b788-312c64aefef6.gif", "subjectOf": [ { "@type": "CreativeWork", "@id": "video", "name": "Video", "description": "", "image": "https://production-media.paperswithcode.com/tasks/default.gif", "subjectOf": [ { "@type": "CreativeWork", "@id": "computer-vision", "name": "Computer Vision", "description": "Browse 1547 tasks \u2022 3353 datasets \u2022 5183 ", "image": "https://paperswithcode.com/static/sota.jpeg", "headline": "Browse state-of-the-art in ML leaderboards \u2022 57150 papers with code." } ], "headline": "Video" }, { "@type": "CreativeWork", "@id": "computer-vision", "name": "Computer Vision", "description": "Browse 1547 tasks \u2022 3353 datasets \u2022 5183 ", "image": "https://paperswithcode.com/static/sota.jpeg", "headline": "Browse state-of-the-art in ML leaderboards \u2022 57150 papers with code." } ], "headline": "Video Generation" } }</script> <meta name="theme-color" content="#fff"/> <link rel="manifest" href="https://production-assets.paperswithcode.com/static/manifest.web.json"> </head> <body> <nav class="navbar navbar-expand-lg navbar-light header"> <a class="navbar-brand" href="/"> <span class=" icon-wrapper" data-name="pwc"><svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 512 512"><path d="M88 128h48v256H88zm144 0h48v256h-48zm-72 16h48v224h-48zm144 0h48v224h-48zm72-16h48v256h-48z"/><path d="M104 104V56H16v400h88v-48H64V104zm304-48v48h40v304h-40v48h88V56z"/></svg></span> </a> <div class="navbar-mobile-twitter d-lg-none"> <a rel="noreferrer" href="https://twitter.com/paperswithcode"> <span class=" icon-wrapper icon-fa icon-fa-brands" data-name="twitter"><svg viewBox="0 0 512.001 515.25" xmlns="http://www.w3.org/2000/svg"><path d="M459.37 152.016c.326 4.548.326 9.097.326 13.645 0 138.72-105.583 298.558-298.559 298.558C101.685 464.22 46.457 447 0 417.114c8.447.973 16.568 1.298 25.34 1.298 49.054 0 94.213-16.568 130.274-44.832-46.132-.975-84.792-31.188-98.113-72.772 6.499.975 12.996 1.624 19.819 1.624 9.42 0 18.843-1.3 27.613-3.573-48.08-9.747-84.142-51.98-84.142-102.984v-1.3c13.968 7.798 30.213 12.67 47.43 13.32-28.263-18.843-46.78-51.006-46.78-87.391 0-19.492 5.196-37.36 14.294-52.954 51.654 63.674 129.3 105.258 216.364 109.807-1.624-7.797-2.599-15.918-2.599-24.04 0-57.827 46.782-104.934 104.934-104.934 30.214 0 57.502 12.67 76.671 33.136 23.715-4.548 46.455-13.319 66.599-25.34-7.798 24.367-24.366 44.834-46.132 57.828 21.117-2.274 41.584-8.122 60.426-16.244-14.292 20.791-32.161 39.309-52.628 54.253z"/></svg></span> </a> </div> <button class="navbar-toggler" type="button" data-toggle="collapse" data-bs-toggle="collapse" data-target="#top-menu" data-bs-target="#top-menu" aria-controls="top-menu" aria-expanded="false" aria-label="Toggle navigation" > <span class="navbar-toggler-icon"></span> </button> <div class="collapse navbar-collapse" id="top-menu"> <ul class="navbar-nav mr-auto navbar-nav__left light-header"> <li class="nav-item header-search"> <form action="/search" method="get" id="id_global_search_form" autocomplete="off"> <input type="text" name="q_meta" style="display:none" id="q_meta" /> <input type="hidden" name="q_type" id="q_type" /> <input id="id_global_search_input" autocomplete="off" value="" name='q' class="global-search" type="search" placeholder='Search'/> <button type="submit" class="icon"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="search"><svg viewBox="0 0 512.025 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M508.5 482.6c4.7 4.7 4.7 12.3 0 17l-9.9 9.9c-4.7 4.7-12.3 4.7-17 0l-129-129c-2.2-2.3-3.5-5.3-3.5-8.5v-10.2C312 396 262.5 417 208 417 93.1 417 0 323.9 0 209S93.1 1 208 1s208 93.1 208 208c0 54.5-21 104-55.3 141.1H371c3.2 0 6.2 1.2 8.5 3.5zM208 385c97.3 0 176-78.7 176-176S305.3 33 208 33 32 111.7 32 209s78.7 176 176 176z"/></svg></span></button> </form> </li> <li class="nav-item"> <a class="nav-link" href="/sota"> Browse State-of-the-Art </a> </li> <li class="nav-item"> <a class="nav-link" href="/datasets"> Datasets </a> </li> <li class="nav-item"> <a class="nav-link" href="/methods">Methods</a> </li> <li class="nav-item dropdown"> <a class="nav-link dropdown-toggle" role="button" id="navbarDropdownRepro" data-toggle="dropdown" data-bs-toggle="dropdown" aria-haspopup="true" aria-expanded="false" > More </a> <div class="dropdown-menu" aria-labelledby="navbarDropdownRepro"> <a class="dropdown-item" href="/newsletter">Newsletter</a> <a class="dropdown-item" href="/rc2022">RC2022</a> <div class="dropdown-divider"></div> <a class="dropdown-item" href="/about">About</a> <a class="dropdown-item" href="/trends">Trends</a> <a class="dropdown-item" href="https://portal.paperswithcode.com/"> Portals </a> <a class="dropdown-item" href="/libraries"> Libraries </a> </div> </li> </ul> <ul class="navbar-nav ml-auto navbar-nav__right navbar-subscribe justify-content-center align-items-center"> <li class="nav-item"> <a class="nav-link" rel="noreferrer" href="https://twitter.com/paperswithcode"> <span class="nav-link-social-icon icon-wrapper icon-fa icon-fa-brands" data-name="twitter"><svg viewBox="0 0 512.001 515.25" xmlns="http://www.w3.org/2000/svg"><path d="M459.37 152.016c.326 4.548.326 9.097.326 13.645 0 138.72-105.583 298.558-298.559 298.558C101.685 464.22 46.457 447 0 417.114c8.447.973 16.568 1.298 25.34 1.298 49.054 0 94.213-16.568 130.274-44.832-46.132-.975-84.792-31.188-98.113-72.772 6.499.975 12.996 1.624 19.819 1.624 9.42 0 18.843-1.3 27.613-3.573-48.08-9.747-84.142-51.98-84.142-102.984v-1.3c13.968 7.798 30.213 12.67 47.43 13.32-28.263-18.843-46.78-51.006-46.78-87.391 0-19.492 5.196-37.36 14.294-52.954 51.654 63.674 129.3 105.258 216.364 109.807-1.624-7.797-2.599-15.918-2.599-24.04 0-57.827 46.782-104.934 104.934-104.934 30.214 0 57.502 12.67 76.671 33.136 23.715-4.548 46.455-13.319 66.599-25.34-7.798 24.367-24.366 44.834-46.132 57.828 21.117-2.274 41.584-8.122 60.426-16.244-14.292 20.791-32.161 39.309-52.628 54.253z"/></svg></span> </a> </li> <li class="nav-item"> <a id="signin-link" class="nav-link" href="/accounts/login?next=/task/video-generation">Sign In</a> </li> </ul> </div> </nav> <!-- Page modals --> <div class="modal fade" id="emailModal" tabindex="-1" role="dialog" aria-labelledby="emailModalLabel" aria-hidden="true"> <div class="modal-dialog" role="document"> <div class="modal-content"> <div class="modal-header"> <h3 class="modal-title" id="emailModalLabel">Subscribe to the PwC Newsletter</h3> <button type="button" class="close" data-dismiss="modal" data-bs-dismiss="modal" aria-label="Close"> <span aria-hidden="true">&times;</span> </button> </div> <form action="" method="post"> <div class="modal-body"> <div class="modal-body-info-text"> Stay informed on the latest trending ML papers with code, research developments, libraries, methods, and datasets.<br/><br/> <a href="/newsletter">Read previous issues</a> </div> <input type="hidden" name="csrfmiddlewaretoken" value="Cq1cGLauLKtR3YGHHaLI2DQ6UtlZsdclF2EfE4ZldFDG0nFHB77zMMABqECLSEDb"> <input placeholder="Enter your email" type="email" class="form-control pwc-email" name="address" id="id_address" max_length="100" required> </div> <div class="modal-footer"> <button type="submit" class="btn btn-primary">Subscribe</button> </div> </form> </div> </div> </div> <!-- Login --> <div class="modal fade" id="loginModal" tabindex="-1" role="dialog" aria-labelledby="loginModalLabel" aria-hidden="true"> <div class="modal-dialog" role="document"> <div class="modal-content"> <div class="modal-header"> <h5 class="modal-title" id="loginModalLabel">Join the community</h5> <button type="button" class="close btn-close" data-dismiss="modal" data-bs-dismiss="modal" aria-label="Close"> <span aria-hidden="true">&times;</span> </button> </div> <div class="login-modal-message"> You need to <a href="/accounts/login?next=/task/video-generation">log in</a> to edit.<br/> You can <a href="/accounts/register?next=/task/video-generation">create a new account</a> if you don't have one.<br/><br/> </div> </div> </div> </div> <!-- Modals go here --> <!-- Edit Task --> <div class="modal fade" id="editTask" role="dialog" aria-labelledby="editTaskLabel" aria-hidden="true"> <div class="modal-dialog modal-lg" role="document"> <div class="modal-content"> <div class="modal-header"> <h5 class="modal-title" id="editTaskLabel">Edit task</h5> <button type="button" class="close btn-close" data-bs-dismiss="modal" aria-label="Close"> <span aria-hidden="true">&times;</span> </button> </div> <div class="modal-body"> <form action="" method="post" enctype="multipart/form-data"> <input type="hidden" name="csrfmiddlewaretoken" value="pSLVgvfNJEfxbF4IcCGRiPPRhsTarcv4SmAhmKsfF3AkfgGRELzwScFzlbYwKu9O"> <div id="div_id_task_name" class="form-group"> <label for="id_task_name" class="col-form-label requiredField"> Task name:<span class="asteriskField">*</span> </label> <div class=""> <input type="text" name="task_name" value="Video Generation" maxlength="200" class="textinput textInput form-control" required="" id="id_task_name" readonly > </div> </div> <div id="div_id_task_area" class="form-group"> <label for="id_task_area" class=" requiredField"> Top-level area:<span class="asteriskField">*</span> </label> <div class=""> <select name="task_area" class="select form-control" required id="id_task_area"> <option value="">---------</option> <option value="17">Adversarial</option> <option value="18">Audio</option> <option value="11">Computer Code</option> <option value="3" selected>Computer Vision</option> <option value="9">Graphs</option> <option value="15">Knowledge Base</option> <option value="7">Medical</option> <option value="6">Methodology</option> <option value="5">Miscellaneous</option> <option value="12">Music</option> <option value="4">Natural Language Processing</option> <option value="13">Playing Games</option> <option value="14">Reasoning</option> <option value="16">Robots</option> <option value="10">Speech</option> <option value="8">Time Series</option> </select> </div> </div> <div id="div_id_task_parent" class="form-group"> <label for="id_task_parent" class=""> Parent task (if any): </label> <div class=""> <select name="task_parent" class="modelselect2 form-control" id="id_task_parent" data-autocomplete-light-language="en" data-autocomplete-light-url="/tag-autocomplete/" data-autocomplete-light-function="select2"> <option value="">---------</option> <option value="913" selected>Video</option> </select> </div> </div> <div id="div_id_description" class="form-group"> <label for="id_description" class=""> Description with markdown (optional): </label> <div class=""> <textarea name="description" cols="40" rows="3" class="textarea form-control" id="id_description"> &lt;span style=&quot;color:grey; opacity: 0.6&quot;&gt;( Various Video Generation Tasks. Gif credit: [MaGViT](https://paperswithcode.com/paper/magvit-masked-generative-video-transformer) )&lt;/span&gt;</textarea> </div> </div> <div id="div_id_image" class="form-group"> <label for="id_image" class=""> Image </label> <div class=""> Currently: <a href="https://production-media.paperswithcode.com/tasks/fae9be37-f327-44c5-b788-312c64aefef6.gif">tasks/fae9be37-f327-44c5-b788-312c64aefef6.gif</a> <input type="checkbox" name="image-clear" id="image-clear_id"> <label for="image-clear_id">Clear</label><br> Change: <input type="file" name="image" accept="image/*" class="clearablefileinput form-control-file" id="id_image"> </div> </div> <div class="modal-footer"> <button type="submit" class="btn btn-primary"> Submit </button> </div> </form> </div> </div> </div> </div> <!-- Add Row --> <div class="modal fade" id="addRow" role="dialog" aria-labelledby="addRowLabel" aria-hidden="true"> <div class="modal-dialog" role="document"> <div class="modal-content"> <div class="modal-header"> <h5 class="modal-title" id="addRowLabel">Add a new evaluation result row</h5> <button type="button" class="close btn-close" data-bs-dismiss="modal" aria-label="Close"> <span aria-hidden="true">&times;</span> </button> </div> <form action="" method="post"> <div class="modal-body"> <input type="hidden" name="csrfmiddlewaretoken" value="pSLVgvfNJEfxbF4IcCGRiPPRhsTarcv4SmAhmKsfF3AkfgGRELzwScFzlbYwKu9O"> <input id="id_task" disabled="disabled" type="hidden" value="534"/> <div id="div_id_paper" class="form-group"> <label for="id_paper" class=" requiredField"> Paper title:<span class="asteriskField">*</span> </label> <div class=""> <select name="paper" class="modelselect2 form-control" required id="id_paper" data-autocomplete-light-language="en" data-autocomplete-light-url="/paper-autocomplete/" data-autocomplete-light-function="select2"> <option value="" selected>---------</option> </select> </div> </div> <div id="div_id_dataset" class="form-group"> <label for="id_dataset" class=" requiredField"> Dataset:<span class="asteriskField">*</span> </label> <div class=""> <select name="dataset" class="modelselect2 form-control" required id="id_dataset" data-autocomplete-light-language="en" data-autocomplete-light-url="/dataset-autocomplete/" data-autocomplete-light-function="select2"> <option value="" selected>---------</option> </select> </div> </div> <div id="div_id_model_name" class="form-group"> <label for="id_model_name" class=" requiredField"> Model name:<span class="asteriskField">*</span> </label> <div class=""> <input type="text" name="model_name" class="textinput textInput form-control" required id="id_model_name"> </div> </div> <div id="div_id_metric" class="form-group"> <label for="id_metric" class=" requiredField"> Metric name:<span class="asteriskField">*</span> </label> <div class=""> <select name="metric" class="modelselect2 form-control" required id="id_metric" data-autocomplete-light-language="en" data-autocomplete-light-url="/metric-autocomplete/" data-autocomplete-light-function="select2"> <option value="" selected>---------</option> </select> </div> </div> <div id="sota-metric-names"> </div> <div class="form-group"> <div id="div_id_metric_higher_is_better" class="form-check"> <input type="checkbox" name="metric_higher_is_better" class="checkboxinput form-check-input" id="id_metric_higher_is_better"> <label for="id_metric_higher_is_better" class="form-check-label"> Higher is better (for the metric) </label> </div> </div> <div id="div_id_metric_value" class="form-group"> <label for="id_metric_value" class=" requiredField"> Metric value:<span class="asteriskField">*</span> </label> <div class=""> <input type="text" name="metric_value" class="textinput textInput form-control" required id="id_metric_value"> </div> </div> <div id="sota-metric-values"> </div> <div class="form-group"> <div id="div_id_uses_additional_data" class="form-check"> <input type="checkbox" name="uses_additional_data" class="checkboxinput form-check-input" id="id_uses_additional_data"> <label for="id_uses_additional_data" class="form-check-label"> Uses extra training data </label> </div> </div> <div id="div_id_evaluated_on" class="form-group"> <label for="id_evaluated_on" class=""> Data evaluated on </label> <div class=""> <input type="text" name="evaluated_on" autocomplete="off" class="dateinput form-control" id="id_evaluated_on"> </div> </div> </div> <div class="modal-footer"> <button type="submit" class="btn btn-primary">Submit </button> </div> </form> </div> </div> </div> </div> <div class="container content content-buffer "> <main> <div class="row task-content" style="margin-top: 3rem;"> <!-- Task Header --> <div class="dataset-header"> <a href="/area/computer-vision"> <span class="badge badge-primary"> <span class=" icon-wrapper icon-fa icon-fa-solid" data-name="images"><svg viewBox="0 0 576 514.999" xmlns="http://www.w3.org/2000/svg"><path d="M480 417.998v16c0 26.51-21.49 48-48 48H48c-26.51 0-48-21.49-48-48v-256c0-26.51 21.49-48 48-48h16v208c0 44.113 35.888 80 80 80h336zm96-80c0 26.51-21.49 48-48 48H144c-26.51 0-48-21.49-48-48v-256c0-26.51 21.49-48 48-48h384c26.51 0 48 21.49 48 48v256zm-320-208c0-26.51-21.49-48-48-48s-48 21.49-48 48 21.49 48 48 48 48-21.49 48-48zm-96 144v48h352v-112l-87.514-87.514c-4.687-4.687-12.285-4.687-16.971 0L272 257.999l-39.514-39.515c-4.688-4.686-12.285-4.686-16.972 0z"/></svg></span> <span>Computer Vision</span> </span> </a> </div> <div class="artefact-header"> <div class="float-right task-edit">  <div class="dropdown edit-button"> <a data-bs-toggle="modal" data-bs-target="#loginModal"> <span class="badge badge-method-edit" style="padding-top:10px;"><span class=" icon-wrapper icon-fa icon-fa-solid" data-name="edit"><svg viewBox="0 0 576 514.999" xmlns="http://www.w3.org/2000/svg"><path d="M402.6 85.198l90.2 90.2c3.8 3.8 3.8 10 0 13.8l-218.399 218.4-92.8 10.3c-12.4 1.4-22.9-9.1-21.5-21.5l10.3-92.8 218.4-218.4c3.799-3.8 10-3.8 13.799 0zm162-22.9c15.2 15.2 15.2 39.9 0 55.2l-35.4 35.4c-3.8 3.8-10 3.8-13.8 0l-90.2-90.2c-3.8-3.8-3.8-10 0-13.8l35.4-35.4c15.3-15.2 40-15.2 55.2 0zM384 348.198c0-3.2 1.3-6.2 3.5-8.5l40-40c7.6-7.5 20.5-2.2 20.5 8.5v157.8c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48v-352c0-26.5 21.5-48 48-48h285.8c10.7 0 16.1 12.9 8.5 20.5l-40 40c-2.3 2.2-5.3 3.5-8.5 3.5H64v320h320v-101.8z"/></svg></span> Edit</span> </a> </div> </div> <h1 id="task-home">Video Generation</h1> <div class="artefact-information"> <p> 378 papers with code • 15 benchmarks • 15 datasets </p> </div> </div> <div class="col-lg-9"> <!--Task Desc--> <div class="description"> <div class="description-content"> <p><span style="color: grey;">( Various Video Generation Tasks. Gif credit: <a href="https://paperswithcode.com/paper/magvit-masked-generative-video-transformer">MaGViT</a> )</span></p> </div> </div> <!-- Mobile image --> <div class="image-container task-image-mobile"> <a href="https://production-media.paperswithcode.com/thumbnails/task/11ba3d1a-5ca7-459a-a0dd-658050e2c75b.gif" data-lightbox="imageresource"> <img id="imageresource" width=100% src="https://production-media.paperswithcode.com/thumbnails/task/11ba3d1a-5ca7-459a-a0dd-658050e2c75b.gif"> </a> </div> <!-- Task Benchmarks --> <div class="task-benchmarks"> <div id="benchmarks" class="collapsed"> <div class="title"> <h2 id="benchmarks">Benchmarks <div class="float-right"> <div class="dropdown edit-button task-add-a-result"> <a data-bs-toggle="modal" data-bs-target="#loginModal"> <span class="badge badge-primary" style="font-size:12px;"> Add a Result</span> </a> </div> </div> </h2> These leaderboards are used to track progress in Video Generation <hr> </div> <div class="sota-table-preview table-responsive"> <table id="benchmarksTable" class="table-striped table-responsive"> <thead> <tr> <th>Trend</th> <th style="padding-left:12px;">Dataset</th> <th style="min-width:200px">Best Model</th> <!-- <th style="width:38%">Paper Title</th> --> <th class="text-center">Paper</th> <th class="text-center">Code</th> <th class="text-center">Compare</th> </tr> </thead> <tbody> <tr onclick="window.location='/sota/video-generation-on-ucf-101';"> <td> <a href="/sota/video-generation-on-ucf-101"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-ucf-101-small_01479dad.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-ucf-101"> UCF-101 </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-ucf-101"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> W.A.L.T-XL (class-conditional) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-ucf-101">Photorealistic Video Generation with Diffusion Models</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/photorealistic-video-generation-with"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-ucf-101" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-bair-robot-pushing';"> <td> <a href="/sota/video-generation-on-bair-robot-pushing"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-bair-robot-pushing-small_849bbef9.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-bair-robot-pushing"> BAIR Robot Pushing </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-bair-robot-pushing"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> MAGVIT </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-bair-robot-pushing">MAGVIT: Masked Generative Video Transformer</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/magvit-masked-generative-video-transformer"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/magvit-masked-generative-video-transformer#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-bair-robot-pushing" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-sky-time-lapse';"> <td> <a href="/sota/video-generation-on-sky-time-lapse"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-sky-time-lapse-small_0ab45024.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-sky-time-lapse"> Sky Time-lapse </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-sky-time-lapse"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> StyleSV (256x256) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-sky-time-lapse">Towards Smooth Video Composition</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/towards-smooth-video-composition"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/towards-smooth-video-composition#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-sky-time-lapse" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-ucf-101-16-frames-64x64';"> <td> <a href="/sota/video-generation-on-ucf-101-16-frames-64x64"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-ucf-101-16-frames-64x64-small_3ec5a02a.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-64x64"> UCF-101 16 frames, 64x64, Unconditional </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-64x64"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> Make-A-Video (ours) vs. CogVideo (Chinese) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-64x64">Make-A-Video: Text-to-Video Generation without Text-Video Data</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/make-a-video-text-to-video-generation-without"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/make-a-video-text-to-video-generation-without#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-ucf-101-16-frames-64x64" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-ucf-101-16-frames';"> <td> <a href="/sota/video-generation-on-ucf-101-16-frames"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-ucf-101-16-frames-small_9469e800.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames"> UCF-101 16 frames, Unconditional, Single GPU </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> TGAN-F </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-ucf-101-16-frames">Lower Dimensional Kernels for Video Discriminators</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/lower-dimensional-kernels-for-video"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/lower-dimensional-kernels-for-video#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-ucf-101-16-frames" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-laion-400m';"> <td> <a href="/sota/video-generation-on-laion-400m"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-laion-400m-small_ce842df0.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-laion-400m"> LAION-400M </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-laion-400m"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> Imagen original (constant=6) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-laion-400m">Imagen Video: High Definition Video Generation with Diffusion Models</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/imagen-video-high-definition-video-generation"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-laion-400m" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-taichi';"> <td> <a href="/sota/video-generation-on-taichi"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-taichi-small_1813a06e.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-taichi"> Taichi </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-taichi"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> StyleSV (256x256) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-taichi">Towards Smooth Video Composition</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/towards-smooth-video-composition"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/towards-smooth-video-composition#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-taichi" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-ucf-101-16-frames-128x128';"> <td> <a href="/sota/video-generation-on-ucf-101-16-frames-128x128"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-ucf-101-16-frames-128x128-small_f5bc8593.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-128x128"> UCF-101 16 frames, 128x128, Unconditional </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-128x128"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> TGANv2 (2020) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-ucf-101-16-frames-128x128">Train Sparsely, Generate Densely: Memory-efficient Unsupervised Training of High-resolution Temporal GAN</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/tganv2-efficient-training-of-large-models-for"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/tganv2-efficient-training-of-large-models-for#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-ucf-101-16-frames-128x128" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-kinetics-600-12-frames';"> <td> <a href="/sota/video-generation-on-kinetics-600-12-frames"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-kinetics-600-12-frames-small_b775e875.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames"> Kinetics-600 12 frames, 64x64 </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> W.A.L.T-L </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames">Photorealistic Video Generation with Diffusion Models</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/photorealistic-video-generation-with"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-kinetics-600-12-frames" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-trailerfaces';"> <td> <a href="/sota/video-generation-on-trailerfaces"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-trailerfaces-small_aff840e2.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-trailerfaces"> TrailerFaces </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-trailerfaces"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> PG-SWGAN-3D </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-trailerfaces">Sliced Wasserstein Generative Models</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/sliced-wasserstein-generative-models-1"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/sliced-wasserstein-generative-models-1#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-trailerfaces" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-kinetics-600-48-frames';"> <td> <a href="/sota/video-generation-on-kinetics-600-48-frames"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-kinetics-600-48-frames-small_cdbcb3ec.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-kinetics-600-48-frames"> Kinetics-600 48 frames, 64x64 </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-kinetics-600-48-frames"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> DVD-GAN </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-kinetics-600-48-frames">Adversarial Video Generation on Complex Datasets</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/efficient-video-generation-on-complex"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/efficient-video-generation-on-complex#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-kinetics-600-48-frames" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-kinetics-600-12-frames-1';"> <td> <a href="/sota/video-generation-on-kinetics-600-12-frames-1"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-kinetics-600-12-frames-1-small_b000ed32.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames-1"> Kinetics-600 12 frames, 128x128 </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames-1"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> DVD-GAN </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-kinetics-600-12-frames-1">Adversarial Video Generation on Complex Datasets</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/efficient-video-generation-on-complex"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/efficient-video-generation-on-complex#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-kinetics-600-12-frames-1" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-how2sign';"> <td> <a href="/sota/video-generation-on-how2sign"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-how2sign-small_b0a8caec.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-how2sign"> How2Sign </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-how2sign"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> INR-V </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-how2sign">INR-V: A Continuous Representation Space for Video-based Generative Tasks</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/inr-v-a-continuous-representation-space-for"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/inr-v-a-continuous-representation-space-for#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-how2sign" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-youtube-driving';"> <td> <a href="/sota/video-generation-on-youtube-driving"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-youtube-driving-small_3a7811c4.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-youtube-driving"> YouTube Driving </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-youtube-driving"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> StyleSV </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-youtube-driving">Towards Smooth Video Composition</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/towards-smooth-video-composition"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/towards-smooth-video-composition#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-youtube-driving" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> <tr onclick="window.location='/sota/video-generation-on-msr-vtt';"> <td> <a href="/sota/video-generation-on-msr-vtt"> <img class="sota-thumb" src="https://production-media.paperswithcode.com/sota-thumbs/video-generation-on-msr-vtt-small_0343dc14.png"/> </a> </td> <td> <div class="dataset black-links"> <a href="/sota/video-generation-on-msr-vtt"> MSR-VTT </a> </div> </td> <td> <div class="black-links"> <a href="/sota/video-generation-on-msr-vtt"> <i class="em em-trophy" style="height:1em;position:relative;top:-2px"></i> VideoAssembler (Zero-Shot, 256x256, class-conditional) </a> </div> </td> <!-- <td> <div class="paper blue-links"> <a href="/sota/video-generation-on-msr-vtt">MagDiff: Multi-Alignment Diffusion for High-Fidelity Video Generation and Editing</a> </div> </td> --> <td> <div class="text-center paper"> <a href="/paper/videoassembler-identity-consistent-video"> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> </a> </div> </td> <td> <div class="text-center github"><a href="/paper/videoassembler-identity-consistent-video#code"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </a></div> </td> <td class="text-center"> <div class="sota-table-link"> <a href="/sota/video-generation-on-msr-vtt" class="btn btn-primary">See&nbsp;all</a> </div> </td> </tr> </tbody> </table> <div class="table-options expand"> <a href="javascript:void(0)" onclick="document.getElementById('benchmarks').classList.remove('collapsed')" >Show all 15 benchmarks</a> </div> <div class="table-options collapse"> <a href="javascript:void(0)" onclick="document.getElementById('benchmarks').classList.add('collapsed')" >Collapse benchmarks</a> </div> </div> </div> </div> <!-- Libraries --> <div class="task-started"> <div class="title task-libraries"> <h2 id="task-libraries">Libraries <span class="lib-info" data-bs-toggle="popover" data-bs-placement="top" data-bs-trigger="hover" data-bs-title="Libraries" data-bs-content="These libraries are updated daily, based on the papers assigned to this task. If you think a Library is missing, make sure this library is added as code to the papers it implements, and that the papers have been assigned to this task." ><span class=" icon-wrapper icon-ion" data-name="information-circle-outline"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M248 64C146.39 64 64 146.39 64 248s82.39 184 184 184 184-82.39 184-184S349.61 64 248 64z" fill="none" stroke="#000" stroke-miterlimit="10" stroke-width="32"/><path fill="none" stroke="#000" stroke-linecap="round" stroke-linejoin="round" stroke-width="32" d="M220 220h32v116"/><path fill="none" stroke="#000" stroke-linecap="round" stroke-miterlimit="10" stroke-width="32" d="M208 340h88"/><path d="M248 130a26 26 0 1 0 26 26 26 26 0 0 0-26-26z"/></svg></span></span> </h2> Use these libraries to find Video Generation models and implementations <hr> <div id="libraries-short-list"> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/stability-ai/generative-models" onclick="captureOutboundLink('https://github.com/stability-ai/generative-models'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> stability-ai/generative-models </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 24,717 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/NUS-HPC-AI-Lab/VideoSys" onclick="captureOutboundLink('https://github.com/NUS-HPC-AI-Lab/VideoSys'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> NUS-HPC-AI-Lab/VideoSys </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 1,783 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/nvlabs/long-video-gan" onclick="captureOutboundLink('https://github.com/nvlabs/long-video-gan'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> nvlabs/long-video-gan </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 317 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> </div> <div id="libraries-full-list" style="display:none"> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/stability-ai/generative-models" onclick="captureOutboundLink('https://github.com/stability-ai/generative-models'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> stability-ai/generative-models </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 24,717 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/NUS-HPC-AI-Lab/VideoSys" onclick="captureOutboundLink('https://github.com/NUS-HPC-AI-Lab/VideoSys'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> NUS-HPC-AI-Lab/VideoSys </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 1,783 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> <div class="row task-library"> <div class="col-12 col-md-6"> <a href="https://github.com/nvlabs/long-video-gan" onclick="captureOutboundLink('https://github.com/nvlabs/long-video-gan'); return true;"> <div class="library-logo"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> </div> nvlabs/long-video-gan </a> </div> <div class="col-6 col-md-3"> <span class="task-library-pwc-count"> 2 papers </span> </div> <div class="col-6 col-md-3"> <div class="library-stars text-nowrap"> 317 <span class=" icon-wrapper icon-ion" data-name="star"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M394 480a16 16 0 0 1-9.39-3L256 383.76 127.39 477a16 16 0 0 1-24.55-18.08L153 310.35 23 221.2a16 16 0 0 1 9-29.2h160.38l48.4-148.95a16 16 0 0 1 30.44 0l48.4 149H480a16 16 0 0 1 9.05 29.2L359 310.35l50.13 148.53A16 16 0 0 1 394 480z"/></svg></span> </div> </div> </div> </div> </div> </div> <!-- Task Datasets --> <div class="title"> <h2 id="datasets">Datasets</h2> <hr> <div class="task-datasets"> <div class="col-md-12"> <ul class="list-unstyled"> <li> <a href="/dataset/ucf101"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000000066-91ee6b2c_rLkoGNp.jpg"> UCF101 </span> </a> </li> <li> <a href="/dataset/kinetics"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000000346-272f35cf_HBiP1jT.jpg"> Kinetics </span> </a> </li> <li> <a href="/dataset/msr-vtt"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000001108-a5f3eefc_8y8tYJ7.jpg"> MSR-VTT </span> </a> </li> <li> <a href="/dataset/webvid"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000007791-e0334b08.jpg"> WebVid </span> </a> </li> <li> <a href="/dataset/laion-400m"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/8c0ebdd4-575c-4ac0-97a1-4756273c8eff.jpg"> LAION-400M </span> </a> </li> <li> <a href="/dataset/kinetics-600"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000002041-272f35cf_UfDo0gD.jpg"> Kinetics-600 </span> </a> </li> <li> <a href="/dataset/how2sign"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/dataset-0000006660-f3f0d984_KJELNgv.jpg"> How2Sign </span> </a> </li> <li> <a href="/dataset/internvid"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/tasks/default.gif"> InternVid </span> </a> </li> <li> <a href="/dataset/bair-robot-pushing"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/tasks/default.gif"> BAIR Robot Pushing </span> </a> </li> <li> <a href="/dataset/celebv-text"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/dataset/c37f7b7d-8503-4480-b851-392a9dae4373.jpg"> CelebV-Text </span> </a> </li> <a href="/datasets?task=video-generation"> <button class="dropdown-toggle badge badge-edit w-100 collapsed" type="button" > See all 15 video generation datasets </button> </a> </ul> </div> </div> </div> <!-- Subtasks --> <div class="title"> <h2 id="subtasks">Subtasks</h2> <hr> <div class="task-subtasks"> <div class="col-md-12"> <ul class="list-unstyled"> <li> <a href="/task/image-to-video"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/tasks/default.gif"> <span>Image to Video Generation</span> </span> </a> </li> <li> <a href="/task/unconditional-video-generation"> <span class="badge badge-primary"> <img src="https://production-media.paperswithcode.com/thumbnails/task/4038fa4a-69b4-4073-8281-4ae128c34f14.jpg"> <span>Unconditional Video Generation</span> </span> </a> </li> </ul> </div> </div> </div> <!-- Papers --> <div class="title paper-list" id="code"> <h2 id="papers-list" class="home-page-title">Most implemented papers</h2> <div class="paper-filter-btn"> <div class="btn-group" role="group"> <a data-title="Most implemented papers" data-call-url="/tasklist/video-generation/greatest" data-target="/task/video-generation" class="list-papers-button list-button-active" style="margin-right:0">Most implemented</a> <a data-title="Hot papers on social media" data-call-url="/tasklist/video-generation/social" data-target="/task/video-generation/social" class="list-papers-button list-button" style="margin-right:0">Social</a> <a data-title="Latest papers" data-call-url="/tasklist/video-generation/latest" data-target="/task/video-generation/latest" class="list-papers-button list-button" style="margin-right:0">Latest</a> <a data-title="Latest papers with no code" data-call-url="/tasklist/video-generation/codeless" data-target="/task/video-generation/codeless" class="list-papers-button list-button">No code</a> </div> </div> </div> <!-- <input id="paper-list-search" type="search" class="form-control form-control-sm" placeholder="Search for a paper, author or keyword"> --> <input id="paper-list-search" type="search" class="form-control form-control-sm" placeholder="Search for a paper, author or keyword"> <div class="loading-tab" style="display: none"> <div class="loader-ellips"> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> </div> </div> <div id="task-papers-list"> <div class="infinite-container text-center"> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/gans-trained-by-a-two-time-scale-update-rule"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1706.08500.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/gans-trained-by-a-two-time-scale-update-rule">GANs Trained by a Two Time-Scale Update Rule Converge to a Local Nash Equilibrium</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/bioinf-jku/TTUR" onclick="captureOutboundLink('https://github.com/bioinf-jku/TTUR'); return true;" style="font-size:13px"> bioinf-jku/TTUR </a> </span> • <span class="item-framework-link"> <img class="" src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAbYAAABiBAMAAADO/+vOAAAACXBIWXMAAA7EAAAOxAGVKw4bAAAAMFBMVEVHcExBUGZCUGZKUmNCUGZCUGZCUGb/igD/jwD/hwD/iwBCUGb/kAD/hAD/mwD/eABjkbvFAAAAC3RSTlMAxZ4pVHvkPbaF3mTG43EAAAjMSURBVHja7Zy/b9tGFMdPImlD8CLXyaRFdRIvWhQrCVJosRMnixblh7NwcWNXixYDXRwvCZChQNGm3rq06RhkSGLJNhf9A2khc81iQWtaCJqDAILK+/2LEk+2AsQEr4BDU7w7fu579967d1YBSEpSkpKUpCSFlh/BdlzRbn4AP+/FEy3T+QB++SeWys2+gWwn74uxRDsJ2Nrtv2OHZv3a6RxD3U7iB/dnp0N0a7dfxQtttwML1A3C/RQvtEEwJZFuEK73LD5oO92BpFu7Fxs3lxkOoG4drpv/X0zcXOZdp9uFsh1z3fyPsYCbfTccIjRBt16v/zEOaL8Nu12sG19vvu/3/z3/bH8Nh4PBQLGTgW5+/1UM0LpDIpusW79/zt3c7jAoAdqA2cljplu/f67d3A5EGxDdTlTd+v1z7OYywyGBU/wbLJBNdnOLeslP/6WWlS4ASM/Pz184FdqAognrrY3IgiK6Oaull/3ps1WULgBIBT+PJmzlKZYN+gDZTgZTskfono1nO/ja2QIfIPk3n+sWxfa169btDvGcZHbS96kxiYNuEE6xk34sdBsMBgMpnvTbvX5MdOsOFDvZY1NSct9ruNwNuvLI9cqXYTta4+WMun1+ItvJ9ndhdpIW2FXjyzndijYdzqTbXqYj20mwE2InzyXbc5CR4xI/CDTjwfYKpsvleDL48GUc2F7D6Ksj7QN8aBVfGLLd+XZ+8Tb9pVQqIpN6f3FdNDPXlN+DJ+6sPywqDV9fvFKMZrPX19eKZmyfUGQp7996aEP+1oTNLiBDfZH8Cn8rguU6vHeJcSxJz8CyCm94l8lvaYRzNfhZjWKz7qGauG27Vqs9xvdnarUtfHU3uFlFbJ+2AdVNsJM4lDZgs3LEC20JbA65V1We4WP/SK6F2JyWAZtVIDUXqMf12ExuiMMbsH3Gcb5mJxlcBNtd5mLxbgdirFCWJn7GZc8skFpXlTuQ7dAlrYxl422hgasjDkqEH6mjq4CNbD4VO9kj83knis3h4UOTdXGP3VtRnvFwu7Z6B7I1WwZsaV6zQbtbYUQrVMsGZHtOd3KKnXxNUw4RbK4QG1VpZ7xsqM9saFHVgfzKEWxi81nSUp4NF7sKHn7KMlmqbiwN9HIsGxGgzt9SZjuiUah3ZT3HxJXiUiScKZsj1oRtzdHxctjIYbsEnvAduJLnalO9ZvfGsd2ALf5QBNfr9BZeahdLJWzOSF/eCrUCkGQGTanbpVts+E3ZkODN26VVOuNT9NkZNropNj1E3eT85Og0EGcr0Ks0XV0FZv0qBAX2usmeqZJJiuRCJuWQsXlX1qATHMOGhrBIB3UDywUbAGVmh+eYXRuhW7APGH3awdgsOu6YKUv+xfbBIbgV5gxy+H2UWlTblleNiksc2R4f4baabFE3aPUVTTc5P9n/WIxiS3PTVyYvVOAvRmRymZl28V7W4U4pRfgR22bo/u1AYJvhRuwG3tlBJYW1UARifyPsZBvCbUexzXG/kyaTI8dnBLnkfRH+GcETEwnZlB7PJihqkxo54ta4qc6pwW5Gz08asFV4UsEmk6PA2cg0dXmAAiSJAZc5LUZxo9kKbDLjpZdlM9DmbkGLq/X11h9tTVKi58xyBRoym8t73xSru8IbVrDcaR7EjGOrC8Pk4sVbxreCBrwCGmiLWpcxdtJEt5zQF1lEOtucFDYrtcisNmOzxJkrTPAs+ueogqAcLUGl+TeYL4nUDfb1oIQLWds5jQ3b92+46aoLb5jCUGZsdovFjHhUiOL7iPRgjjWVBRF20o/UTct7heoGcNTC6VqCISMLTWNrzNOSldk8xS/YGD/oayONPp1Rl7dmJ32/F62bxlYMZbtBP77EbSNlI/5AYwv1b47K1mSmIxi/vI3aLasuQMuXoLxyFJttxmbV6ecXGBsQ2FqTsDFrSqsgk2+haY4Uqwj8IHT/htKT26dg09ebGOFuAmXVnJ3NhSwOaiUH+ysILYXaSf+PKeoGcChNw9sp6UbnJJqDKXTtwno51QVodtJ64Ruut3mhjGID9hJhOwxh807NRuOw6hxquQx/6nl8NS4Bsy98MzYlaR7OBsA1TOeF2EljNslO0sgNVs1XUA2onq3ucMLyk7NvzfybwpYbwUYnZlX3bw1TNivEvyHgjQLqCerqaC4gLD+ZiWarq1ul0brR5blhFpeE73FC4hIEfFBHLcLLVX24w/KTN43iyX1jNhpam8ST4WxqPLlPBrhJZnlwuSRIG24n22NTtozN1XPZGttMrVbb4PUO5Hcno2PI5gqLKUdHqCBnvfR0fnh+MoqtzPemANwKX29z/E3TPLxt6vs3A7Yyj/Ftllmr8LRuRcnwhsclZmzplrjJyYfqlpL3r2SzRgxlWth3G7CllB07W7JiQkg7yg05xzFgs1piprIRyubIeQeywyI7OlfIlxiw2XKmpckpefpOcwGn1E3Iaq0KuSDZljASm5rVAsnqgWUxz2XAhmY8ynMtc4GclpR21Sx3qJ00YMMh/uP1O0stPV/i8pxC63LgvXPUhKOp4z1U8pMmbGWSn7xV5xAWz86DVojHPaWdVHY5+VDdUmLueUxe2YRNyis3hL2ux41nqzgVOynvkZvh/o1vcdgyE2sdggnYpJT8puBHhBMjD0xnveE1JB5Sjdubhp3jtIoTsYnnOEXZ/9M52wRTsZPSSdrWyHiyoJzRibgLYCI2QfK8mBPc5w8ejtHteBLdyOEuPPEYHXPJZ53S2dYWmJCNtXVB+jTLt0z74CzrDf6pJj+7vp4jhhCV+4uLi8RQrQaP5YUz6u8fCCf5+PyR1nLEFmG9Ba1DymI9Es67ceUgqiNdWsFlHoy3k/5Ef+5wbS3y7wastbUSiPw7BbNiT1hT3XeDGJWJ7OS5Y5PsZC/GusVqTqKvZPL1Fq8vZaKv0lLdXoN4ldk3TLf4fQk6g7/ffdx+vw3iB4d1i+f/dGAHsrX3QCzLbsD2DMS0/B78l5SkJCUpSUlKUpKSlGmW/wErOKTxUOS81gAAAABJRU5ErkJggg==" /> </span> • <span class="item-conference-link"> <a href="/conference/neurips-2017-12"> NeurIPS 2017 </a> </span> </p> <p class="item-strip-abstract">Generative Adversarial Networks (GANs) excel at creating realistic images with complex models for which maximum likelihood is infeasible.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 69</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/gans-trained-by-a-two-time-scale-update-rule" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/gans-trained-by-a-two-time-scale-update-rule#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/consistency-models"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/2303.01469.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/consistency-models">Consistency Models</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/openai/consistency_models" onclick="captureOutboundLink('https://github.com/openai/consistency_models'); return true;" style="font-size:13px"> openai/consistency_models </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="author-name-text item-date-pub">2 Mar 2023</span> </p> <p class="item-strip-abstract">Through extensive experiments, we demonstrate that they outperform existing distillation techniques for diffusion models in one- and few-step sampling, achieving the new state-of-the-art FID of 3. 55 on CIFAR-10 and 6. 20 on ImageNet 64x64 for one-step generation.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 14</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/consistency-models" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/consistency-models#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/everybody-dance-now"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1808.07371.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/everybody-dance-now">Everybody Dance Now</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/carolineec/EverybodyDanceNow" onclick="captureOutboundLink('https://github.com/carolineec/EverybodyDanceNow'); return true;" style="font-size:13px"> carolineec/EverybodyDanceNow </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="item-conference-link"> <a href="/conference/iccv-2019-10"> ICCV 2019 </a> </span> </p> <p class="item-strip-abstract">This paper presents a simple method for &quot;do as I do&quot; motion transfer: given a source video of a person dancing, we can transfer that performance to a novel (amateur) target after only a few minutes of the target subject performing standard moves.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 13</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/everybody-dance-now" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/everybody-dance-now#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/temporally-coherent-gans-for-video-super"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1811.09393.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/temporally-coherent-gans-for-video-super">Learning Temporal Coherence via Self-Supervision for GAN-based Video Generation</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/thunil/TecoGAN" onclick="captureOutboundLink('https://github.com/thunil/TecoGAN'); return true;" style="font-size:13px"> thunil/TecoGAN </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="author-name-text item-date-pub">23 Nov 2018</span> </p> <p class="item-strip-abstract">Additionally, we propose a first set of metrics to quantitatively evaluate the accuracy as well as the perceptual quality of the temporal evolution.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 13</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/temporally-coherent-gans-for-video-super" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/temporally-coherent-gans-for-video-super#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/mocogan-decomposing-motion-and-content-for"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1707.04993.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/mocogan-decomposing-motion-and-content-for">MoCoGAN: Decomposing Motion and Content for Video Generation</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/sergeytulyakov/mocogan" onclick="captureOutboundLink('https://github.com/sergeytulyakov/mocogan'); return true;" style="font-size:13px"> sergeytulyakov/mocogan </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="item-conference-link"> <a href="/conference/cvpr-2018-6"> CVPR 2018 </a> </span> </p> <p class="item-strip-abstract">The proposed framework generates a video by mapping a sequence of random vectors to a sequence of video frames.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 5</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/mocogan-decomposing-motion-and-content-for" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/mocogan-decomposing-motion-and-content-for#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/temporal-generative-adversarial-nets-with"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1611.06624.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/temporal-generative-adversarial-nets-with">Temporal Generative Adversarial Nets with Singular Value Clipping</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/universome/stylegan-v" onclick="captureOutboundLink('https://github.com/universome/stylegan-v'); return true;" style="font-size:13px"> universome/stylegan-v </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="item-conference-link"> <a href="/conference/iccv-2017-10"> ICCV 2017 </a> </span> </p> <p class="item-strip-abstract">In this paper, we propose a generative model, Temporal Generative Adversarial Nets (TGAN), which can learn a semantic representation of unlabeled videos, and is capable of generating videos.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 4</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/temporal-generative-adversarial-nets-with" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/temporal-generative-adversarial-nets-with#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/stochastic-adversarial-video-prediction"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1804.01523.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/stochastic-adversarial-video-prediction">Stochastic Adversarial Video Prediction</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/alexlee-gk/video_prediction" onclick="captureOutboundLink('https://github.com/alexlee-gk/video_prediction'); return true;" style="font-size:13px"> alexlee-gk/video_prediction </a> </span> • <span class="item-framework-link"> <img class="" src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAbYAAABiBAMAAADO/+vOAAAACXBIWXMAAA7EAAAOxAGVKw4bAAAAMFBMVEVHcExBUGZCUGZKUmNCUGZCUGZCUGb/igD/jwD/hwD/iwBCUGb/kAD/hAD/mwD/eABjkbvFAAAAC3RSTlMAxZ4pVHvkPbaF3mTG43EAAAjMSURBVHja7Zy/b9tGFMdPImlD8CLXyaRFdRIvWhQrCVJosRMnixblh7NwcWNXixYDXRwvCZChQNGm3rq06RhkSGLJNhf9A2khc81iQWtaCJqDAILK+/2LEk+2AsQEr4BDU7w7fu579967d1YBSEpSkpKUpCSFlh/BdlzRbn4AP+/FEy3T+QB++SeWys2+gWwn74uxRDsJ2Nrtv2OHZv3a6RxD3U7iB/dnp0N0a7dfxQtttwML1A3C/RQvtEEwJZFuEK73LD5oO92BpFu7Fxs3lxkOoG4drpv/X0zcXOZdp9uFsh1z3fyPsYCbfTccIjRBt16v/zEOaL8Nu12sG19vvu/3/z3/bH8Nh4PBQLGTgW5+/1UM0LpDIpusW79/zt3c7jAoAdqA2cljplu/f67d3A5EGxDdTlTd+v1z7OYywyGBU/wbLJBNdnOLeslP/6WWlS4ASM/Pz184FdqAognrrY3IgiK6Oaull/3ps1WULgBIBT+PJmzlKZYN+gDZTgZTskfono1nO/ja2QIfIPk3n+sWxfa169btDvGcZHbS96kxiYNuEE6xk34sdBsMBgMpnvTbvX5MdOsOFDvZY1NSct9ruNwNuvLI9cqXYTta4+WMun1+ItvJ9ndhdpIW2FXjyzndijYdzqTbXqYj20mwE2InzyXbc5CR4xI/CDTjwfYKpsvleDL48GUc2F7D6Ksj7QN8aBVfGLLd+XZ+8Tb9pVQqIpN6f3FdNDPXlN+DJ+6sPywqDV9fvFKMZrPX19eKZmyfUGQp7996aEP+1oTNLiBDfZH8Cn8rguU6vHeJcSxJz8CyCm94l8lvaYRzNfhZjWKz7qGauG27Vqs9xvdnarUtfHU3uFlFbJ+2AdVNsJM4lDZgs3LEC20JbA65V1We4WP/SK6F2JyWAZtVIDUXqMf12ExuiMMbsH3Gcb5mJxlcBNtd5mLxbgdirFCWJn7GZc8skFpXlTuQ7dAlrYxl422hgasjDkqEH6mjq4CNbD4VO9kj83knis3h4UOTdXGP3VtRnvFwu7Z6B7I1WwZsaV6zQbtbYUQrVMsGZHtOd3KKnXxNUw4RbK4QG1VpZ7xsqM9saFHVgfzKEWxi81nSUp4NF7sKHn7KMlmqbiwN9HIsGxGgzt9SZjuiUah3ZT3HxJXiUiScKZsj1oRtzdHxctjIYbsEnvAduJLnalO9ZvfGsd2ALf5QBNfr9BZeahdLJWzOSF/eCrUCkGQGTanbpVts+E3ZkODN26VVOuNT9NkZNropNj1E3eT85Og0EGcr0Ks0XV0FZv0qBAX2usmeqZJJiuRCJuWQsXlX1qATHMOGhrBIB3UDywUbAGVmh+eYXRuhW7APGH3awdgsOu6YKUv+xfbBIbgV5gxy+H2UWlTblleNiksc2R4f4baabFE3aPUVTTc5P9n/WIxiS3PTVyYvVOAvRmRymZl28V7W4U4pRfgR22bo/u1AYJvhRuwG3tlBJYW1UARifyPsZBvCbUexzXG/kyaTI8dnBLnkfRH+GcETEwnZlB7PJihqkxo54ta4qc6pwW5Gz08asFV4UsEmk6PA2cg0dXmAAiSJAZc5LUZxo9kKbDLjpZdlM9DmbkGLq/X11h9tTVKi58xyBRoym8t73xSru8IbVrDcaR7EjGOrC8Pk4sVbxreCBrwCGmiLWpcxdtJEt5zQF1lEOtucFDYrtcisNmOzxJkrTPAs+ueogqAcLUGl+TeYL4nUDfb1oIQLWds5jQ3b92+46aoLb5jCUGZsdovFjHhUiOL7iPRgjjWVBRF20o/UTct7heoGcNTC6VqCISMLTWNrzNOSldk8xS/YGD/oayONPp1Rl7dmJ32/F62bxlYMZbtBP77EbSNlI/5AYwv1b47K1mSmIxi/vI3aLasuQMuXoLxyFJttxmbV6ecXGBsQ2FqTsDFrSqsgk2+haY4Uqwj8IHT/htKT26dg09ebGOFuAmXVnJ3NhSwOaiUH+ysILYXaSf+PKeoGcChNw9sp6UbnJJqDKXTtwno51QVodtJ64Ruut3mhjGID9hJhOwxh807NRuOw6hxquQx/6nl8NS4Bsy98MzYlaR7OBsA1TOeF2EljNslO0sgNVs1XUA2onq3ucMLyk7NvzfybwpYbwUYnZlX3bw1TNivEvyHgjQLqCerqaC4gLD+ZiWarq1ul0brR5blhFpeE73FC4hIEfFBHLcLLVX24w/KTN43iyX1jNhpam8ST4WxqPLlPBrhJZnlwuSRIG24n22NTtozN1XPZGttMrVbb4PUO5Hcno2PI5gqLKUdHqCBnvfR0fnh+MoqtzPemANwKX29z/E3TPLxt6vs3A7Yyj/Ftllmr8LRuRcnwhsclZmzplrjJyYfqlpL3r2SzRgxlWth3G7CllB07W7JiQkg7yg05xzFgs1piprIRyubIeQeywyI7OlfIlxiw2XKmpckpefpOcwGn1E3Iaq0KuSDZljASm5rVAsnqgWUxz2XAhmY8ynMtc4GclpR21Sx3qJ00YMMh/uP1O0stPV/i8pxC63LgvXPUhKOp4z1U8pMmbGWSn7xV5xAWz86DVojHPaWdVHY5+VDdUmLueUxe2YRNyis3hL2ux41nqzgVOynvkZvh/o1vcdgyE2sdggnYpJT8puBHhBMjD0xnveE1JB5Sjdubhp3jtIoTsYnnOEXZ/9M52wRTsZPSSdrWyHiyoJzRibgLYCI2QfK8mBPc5w8ejtHteBLdyOEuPPEYHXPJZ53S2dYWmJCNtXVB+jTLt0z74CzrDf6pJj+7vp4jhhCV+4uLi8RQrQaP5YUz6u8fCCf5+PyR1nLEFmG9Ba1DymI9Es67ceUgqiNdWsFlHoy3k/5Ef+5wbS3y7wastbUSiPw7BbNiT1hT3XeDGJWJ7OS5Y5PsZC/GusVqTqKvZPL1Fq8vZaKv0lLdXoN4ldk3TLf4fQk6g7/ffdx+vw3iB4d1i+f/dGAHsrX3QCzLbsD2DMS0/B78l5SkJCUpSUlKUpKSlGmW/wErOKTxUOS81gAAAABJRU5ErkJggg==" /> </span> • <span class="item-conference-link"> <a href="/conference/iclr-2019-5"> ICLR 2019 </a> </span> </p> <p class="item-strip-abstract">However, learning to predict raw future observations, such as frames in a video, is exceedingly challenging -- the ambiguous nature of the problem can cause a naively designed model to average together possible futures into a single, blurry prediction.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 4</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/stochastic-adversarial-video-prediction" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/stochastic-adversarial-video-prediction#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/video-diffusion-models"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/2204.03458.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/video-diffusion-models">Video Diffusion Models</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/lucidrains/make-a-video-pytorch" onclick="captureOutboundLink('https://github.com/lucidrains/make-a-video-pytorch'); return true;" style="font-size:13px"> lucidrains/make-a-video-pytorch </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="author-name-text item-date-pub">7 Apr 2022</span> </p> <p class="item-strip-abstract">Generating temporally coherent high fidelity video is an important milestone in generative modeling research.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 4</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/video-diffusion-models" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/video-diffusion-models#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/collaborative-neural-rendering-using-anime"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/2207.05378.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/collaborative-neural-rendering-using-anime">Collaborative Neural Rendering using Anime Character Sheets</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/transpchan/Live3D" onclick="captureOutboundLink('https://github.com/transpchan/Live3D'); return true;" style="font-size:13px"> transpchan/Live3D </a> </span> • <span class="item-framework-link"> <img class="" src="https://production-assets.paperswithcode.com/perf/images/frameworks/pytorch-2fbf2cb9.png" /> </span> • <span class="author-name-text item-date-pub">12 Jul 2022</span> </p> <p class="item-strip-abstract">Drawing images of characters with desired poses is an essential but laborious task in anime production.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 4</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/collaborative-neural-rendering-using-anime" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/collaborative-neural-rendering-using-anime#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> <div class="paper-card infinite-item"> <!-- None --> <div class="container-fluid"> <div class="row"> <div class="col-lg-3"> <a href="/paper/stochastic-variational-video-prediction"> <div class="item-image" style="background-image: url('https://production-media.paperswithcode.com/thumbnails/paper/1710.11252.jpg');"> </div> </a> </div> <div class="col-lg-9"> <div class="row"> <div class="col-lg-9 item-content"> <h1><a href="/paper/stochastic-variational-video-prediction">Stochastic Variational Video Prediction</a></h1> <p class="author-section" style="padding-top:2px"> <span class="item-github-link"> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> <a href="https://github.com/StanfordVL/roboturk_real_dataset" onclick="captureOutboundLink('https://github.com/StanfordVL/roboturk_real_dataset'); return true;" style="font-size:13px"> StanfordVL/roboturk_real_dataset </a> </span> • <span class="item-framework-link"> <img class="" src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAAbYAAABiBAMAAADO/+vOAAAACXBIWXMAAA7EAAAOxAGVKw4bAAAAMFBMVEVHcExBUGZCUGZKUmNCUGZCUGZCUGb/igD/jwD/hwD/iwBCUGb/kAD/hAD/mwD/eABjkbvFAAAAC3RSTlMAxZ4pVHvkPbaF3mTG43EAAAjMSURBVHja7Zy/b9tGFMdPImlD8CLXyaRFdRIvWhQrCVJosRMnixblh7NwcWNXixYDXRwvCZChQNGm3rq06RhkSGLJNhf9A2khc81iQWtaCJqDAILK+/2LEk+2AsQEr4BDU7w7fu579967d1YBSEpSkpKUpCSFlh/BdlzRbn4AP+/FEy3T+QB++SeWys2+gWwn74uxRDsJ2Nrtv2OHZv3a6RxD3U7iB/dnp0N0a7dfxQtttwML1A3C/RQvtEEwJZFuEK73LD5oO92BpFu7Fxs3lxkOoG4drpv/X0zcXOZdp9uFsh1z3fyPsYCbfTccIjRBt16v/zEOaL8Nu12sG19vvu/3/z3/bH8Nh4PBQLGTgW5+/1UM0LpDIpusW79/zt3c7jAoAdqA2cljplu/f67d3A5EGxDdTlTd+v1z7OYywyGBU/wbLJBNdnOLeslP/6WWlS4ASM/Pz184FdqAognrrY3IgiK6Oaull/3ps1WULgBIBT+PJmzlKZYN+gDZTgZTskfono1nO/ja2QIfIPk3n+sWxfa169btDvGcZHbS96kxiYNuEE6xk34sdBsMBgMpnvTbvX5MdOsOFDvZY1NSct9ruNwNuvLI9cqXYTta4+WMun1+ItvJ9ndhdpIW2FXjyzndijYdzqTbXqYj20mwE2InzyXbc5CR4xI/CDTjwfYKpsvleDL48GUc2F7D6Ksj7QN8aBVfGLLd+XZ+8Tb9pVQqIpN6f3FdNDPXlN+DJ+6sPywqDV9fvFKMZrPX19eKZmyfUGQp7996aEP+1oTNLiBDfZH8Cn8rguU6vHeJcSxJz8CyCm94l8lvaYRzNfhZjWKz7qGauG27Vqs9xvdnarUtfHU3uFlFbJ+2AdVNsJM4lDZgs3LEC20JbA65V1We4WP/SK6F2JyWAZtVIDUXqMf12ExuiMMbsH3Gcb5mJxlcBNtd5mLxbgdirFCWJn7GZc8skFpXlTuQ7dAlrYxl422hgasjDkqEH6mjq4CNbD4VO9kj83knis3h4UOTdXGP3VtRnvFwu7Z6B7I1WwZsaV6zQbtbYUQrVMsGZHtOd3KKnXxNUw4RbK4QG1VpZ7xsqM9saFHVgfzKEWxi81nSUp4NF7sKHn7KMlmqbiwN9HIsGxGgzt9SZjuiUah3ZT3HxJXiUiScKZsj1oRtzdHxctjIYbsEnvAduJLnalO9ZvfGsd2ALf5QBNfr9BZeahdLJWzOSF/eCrUCkGQGTanbpVts+E3ZkODN26VVOuNT9NkZNropNj1E3eT85Og0EGcr0Ks0XV0FZv0qBAX2usmeqZJJiuRCJuWQsXlX1qATHMOGhrBIB3UDywUbAGVmh+eYXRuhW7APGH3awdgsOu6YKUv+xfbBIbgV5gxy+H2UWlTblleNiksc2R4f4baabFE3aPUVTTc5P9n/WIxiS3PTVyYvVOAvRmRymZl28V7W4U4pRfgR22bo/u1AYJvhRuwG3tlBJYW1UARifyPsZBvCbUexzXG/kyaTI8dnBLnkfRH+GcETEwnZlB7PJihqkxo54ta4qc6pwW5Gz08asFV4UsEmk6PA2cg0dXmAAiSJAZc5LUZxo9kKbDLjpZdlM9DmbkGLq/X11h9tTVKi58xyBRoym8t73xSru8IbVrDcaR7EjGOrC8Pk4sVbxreCBrwCGmiLWpcxdtJEt5zQF1lEOtucFDYrtcisNmOzxJkrTPAs+ueogqAcLUGl+TeYL4nUDfb1oIQLWds5jQ3b92+46aoLb5jCUGZsdovFjHhUiOL7iPRgjjWVBRF20o/UTct7heoGcNTC6VqCISMLTWNrzNOSldk8xS/YGD/oayONPp1Rl7dmJ32/F62bxlYMZbtBP77EbSNlI/5AYwv1b47K1mSmIxi/vI3aLasuQMuXoLxyFJttxmbV6ecXGBsQ2FqTsDFrSqsgk2+haY4Uqwj8IHT/htKT26dg09ebGOFuAmXVnJ3NhSwOaiUH+ysILYXaSf+PKeoGcChNw9sp6UbnJJqDKXTtwno51QVodtJ64Ruut3mhjGID9hJhOwxh807NRuOw6hxquQx/6nl8NS4Bsy98MzYlaR7OBsA1TOeF2EljNslO0sgNVs1XUA2onq3ucMLyk7NvzfybwpYbwUYnZlX3bw1TNivEvyHgjQLqCerqaC4gLD+ZiWarq1ul0brR5blhFpeE73FC4hIEfFBHLcLLVX24w/KTN43iyX1jNhpam8ST4WxqPLlPBrhJZnlwuSRIG24n22NTtozN1XPZGttMrVbb4PUO5Hcno2PI5gqLKUdHqCBnvfR0fnh+MoqtzPemANwKX29z/E3TPLxt6vs3A7Yyj/Ftllmr8LRuRcnwhsclZmzplrjJyYfqlpL3r2SzRgxlWth3G7CllB07W7JiQkg7yg05xzFgs1piprIRyubIeQeywyI7OlfIlxiw2XKmpckpefpOcwGn1E3Iaq0KuSDZljASm5rVAsnqgWUxz2XAhmY8ynMtc4GclpR21Sx3qJ00YMMh/uP1O0stPV/i8pxC63LgvXPUhKOp4z1U8pMmbGWSn7xV5xAWz86DVojHPaWdVHY5+VDdUmLueUxe2YRNyis3hL2ux41nqzgVOynvkZvh/o1vcdgyE2sdggnYpJT8puBHhBMjD0xnveE1JB5Sjdubhp3jtIoTsYnnOEXZ/9M52wRTsZPSSdrWyHiyoJzRibgLYCI2QfK8mBPc5w8ejtHteBLdyOEuPPEYHXPJZ53S2dYWmJCNtXVB+jTLt0z74CzrDf6pJj+7vp4jhhCV+4uLi8RQrQaP5YUz6u8fCCf5+PyR1nLEFmG9Ba1DymI9Es67ceUgqiNdWsFlHoy3k/5Ef+5wbS3y7wastbUSiPw7BbNiT1hT3XeDGJWJ7OS5Y5PsZC/GusVqTqKvZPL1Fq8vZaKv0lLdXoN4ldk3TLf4fQk6g7/ffdx+vw3iB4d1i+f/dGAHsrX3QCzLbsD2DMS0/B78l5SkJCUpSUlKUpKSlGmW/wErOKTxUOS81gAAAABJRU5ErkJggg==" /> </span> • <span class="item-conference-link"> <a href="/conference/iclr-2018-1"> ICLR 2018 </a> </span> </p> <p class="item-strip-abstract">We find that our proposed method produces substantially improved video predictions when compared to the same model without stochasticity, and to other stochastic video prediction methods.</p> </div> <div class="col-lg-3 item-interact text-center"> <div class="entity-stars"> <span class="badge badge-secondary"><span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> 3</span> </div> <div class="entity" style="margin-bottom: 20px;"> <a href="/paper/stochastic-variational-video-prediction" class="badge badge-light "> <span class=" icon-wrapper icon-ion" data-name="document"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M428 224H288a48 48 0 0 1-48-48V36a4 4 0 0 0-4-4h-92a64 64 0 0 0-64 64v320a64 64 0 0 0 64 64h224a64 64 0 0 0 64-64V228a4 4 0 0 0-4-4z"/><path d="M419.22 188.59L275.41 44.78a2 2 0 0 0-3.41 1.41V176a16 16 0 0 0 16 16h129.81a2 2 0 0 0 1.41-3.41z"/></svg></span> Paper </a> <br/> <a href="/paper/stochastic-variational-video-prediction#code" class="badge badge-dark "> <span class=" icon-wrapper icon-ion" data-name="logo-github"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M256 32C132.3 32 32 134.9 32 261.7c0 101.5 64.2 187.5 153.2 217.9a17.56 17.56 0 0 0 3.8.4c8.3 0 11.5-6.1 11.5-11.4 0-5.5-.2-19.9-.3-39.1a102.4 102.4 0 0 1-22.6 2.7c-43.1 0-52.9-33.5-52.9-33.5-10.2-26.5-24.9-33.6-24.9-33.6-19.5-13.7-.1-14.1 1.4-14.1h.1c22.5 2 34.3 23.8 34.3 23.8 11.2 19.6 26.2 25.1 39.6 25.1a63 63 0 0 0 25.6-6c2-14.8 7.8-24.9 14.2-30.7-49.7-5.8-102-25.5-102-113.5 0-25.1 8.7-45.6 23-61.6-2.3-5.8-10-29.2 2.2-60.8a18.64 18.64 0 0 1 5-.5c8.1 0 26.4 3.1 56.6 24.1a208.21 208.21 0 0 1 112.2 0c30.2-21 48.5-24.1 56.6-24.1a18.64 18.64 0 0 1 5 .5c12.2 31.6 4.5 55 2.2 60.8 14.3 16.1 23 36.6 23 61.6 0 88.2-52.4 107.6-102.3 113.3 8 7.1 15.2 21.1 15.2 42.5 0 30.7-.3 55.5-.3 63 0 5.4 3.1 11.5 11.4 11.5a19.35 19.35 0 0 0 4-.4C415.9 449.2 480 363.1 480 261.7 480 134.9 379.7 32 256 32z"/></svg></span> Code </a> <br/> </div> </div> </div> </div> </div> </div> </div> </div> <div class="loading" style="display: none"> <div class="loader-ellips infinite-scroll-request"> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> <span class="loader-ellips__dot"></span> </div> </div> <a class="infinite-more-link" href="?page=2&q="></a> </div> <div class="loading-trigger"></div> </div> <div class="col-lg-3 wide-sidebar task-infobox" id="task-sidebar"> <div class="image-container"> <a href="https://production-media.paperswithcode.com/thumbnails/task/11ba3d1a-5ca7-459a-a0dd-658050e2c75b.gif" data-lightbox="imageresource"> <img id="imageresource" width=100% src="https://production-media.paperswithcode.com/thumbnails/task/11ba3d1a-5ca7-459a-a0dd-658050e2c75b.gif"> </a> </div> <div class="task-toc"> <h4>Content</h4> <hr> <nav> <a class="toc-link" href="#task-home"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="book"><svg viewBox="0 0 448 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M356 161H188c-6.6 0-12-5.4-12-12v-8c0-6.6 5.4-12 12-12h168c6.6 0 12 5.4 12 12v8c0 6.6-5.4 12-12 12zm12 52c0 6.6-5.4 12-12 12H188c-6.6 0-12-5.4-12-12v-8c0-6.6 5.4-12 12-12h168c6.6 0 12 5.4 12 12v8zm64.7 268h3.3c6.6 0 12 5.4 12 12v8c0 6.6-5.4 12-12 12H80c-44.2 0-80-35.8-80-80V81C0 36.8 35.8 1 80 1h344c13.3 0 24 10.7 24 24v368c0 10-6.2 18.6-14.9 22.2-3.6 16.1-4.4 45.6-.4 65.8zM128 385h288V33H128v352zm-96 16c13.4-10 30-16 48-16h16V33H80c-26.5 0-48 21.5-48 48v320zm372.3 80c-3.1-20.4-2.9-45.2 0-64H80c-64 0-64 64 0 64h324.3z"/></svg></span> Introduction</a> <a class="toc-link" href="#benchmarks"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="chart-line"><svg viewBox="0 0 512 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M504 417c4.42 0 8 3.58 8 8v16c0 4.42-3.58 8-8 8H16c-8.84 0-16-7.16-16-16V73c0-4.42 3.58-8 8-8h16c4.42 0 8 3.58 8 8v344h472zM98.34 264.03l84.12-83.32c6.25-6.2 16.34-6.18 22.57.05l84.63 84.63 82.22-82.22-44.71-44.71C311.87 123.16 322.7 97 344.34 97h119.47c8.94 0 16.19 7.25 16.19 16.19v119.47c0 14.64-11.98 24.34-24.46 24.34-5.97 0-12.05-2.21-17-7.16L394.5 205.8l-93.53 93.53c-6.25 6.25-16.38 6.25-22.63 0l-84.69-84.69-72.69 72.01c-3.12 3.12-8.19 3.12-11.31 0l-11.31-11.31c-3.12-3.12-3.12-8.19 0-11.31zM362.96 129L448 214.04V129h-85.04z"/></svg></span> Benchmarks</a> <a class="toc-link" href="#datasets"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="database"><svg viewBox="0 0 448 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M224 33C118 33 32 61.75 32 97v32c0 35.25 86 64 192 64s192-28.75 192-64V97c0-35.25-86-64-192-64zm192 149.5c-41.251 29-116.75 42.5-192 42.5S73.25 211.5 32 182.5V225c0 35.25 86 64 192 64s192-28.75 192-64v-42.5zm0 96c-41.251 29-116.75 42.5-192 42.5S73.25 307.5 32 278.5V321c0 35.25 86 64 192 64s192-28.75 192-64v-42.5zm0 96c-41.251 29-116.75 42.5-192 42.5S73.25 403.5 32 374.5V417c0 35.25 86 64 192 64s192-28.75 192-64v-42.5zM224 1c77.904 0 224 18.662 224 96v320c0 77.2-145.858 96-224 96-77.904 0-224-18.662-224-96V97C0 19.8 145.858 1 224 1z"/></svg></span> Datasets</a> <a class="toc-link" href="#subtasks"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="sitemap"><svg viewBox="0 0 640 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M608 353c17.67 0 32 14.33 32 32v96c0 17.67-14.33 32-32 32h-96c-17.67 0-32-14.33-32-32v-96c0-17.67 14.33-32 32-32h32v-96H336v96h32c17.67 0 32 14.33 32 32v96c0 17.67-14.33 32-32 32h-96c-17.67 0-32-14.33-32-32v-96c0-17.67 14.33-32 32-32h32v-96H96v96h32c17.67 0 32 14.33 32 32v96c0 17.67-14.33 32-32 32H32c-17.67 0-32-14.33-32-32v-96c0-17.67 14.33-32 32-32h32v-97.59C64 238.64 77.62 225 94.41 225H304v-64h-48c-17.67 0-32-14.33-32-32V33c0-17.67 14.33-32 32-32h128c17.67 0 32 14.33 32 32v96c0 17.67-14.33 32-32 32h-48v64h209.59c16.79 0 30.41 13.64 30.41 30.41V353h32zm-480 32H32v96h96v-96zm240 0h-96v96h96v-96zM256 129h128V33H256v96zm352 352v-96h-96v96h96z"/></svg></span> Subtasks</a> <a class="toc-link" href="#task-libraries"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="file-code"><svg viewBox="0 0 384 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M369.941 98.941c7.76 7.76 14.059 22.966 14.059 33.94V465c0 26.51-21.49 48-48 48H48c-26.51 0-48-21.49-48-48V49C0 22.49 21.49 1 48 1h204.118c10.975 0 26.18 6.3 33.94 14.059zm-22.627 22.628l-83.883-83.884c-1.728-1.73-5.057-3.608-7.431-4.194V129h95.509c-.586-2.374-2.465-5.703-4.195-7.431zM336 481c8.837 0 16-7.163 16-16V161H248c-13.254 0-24-10.745-24-24V33H48c-8.836 0-16 7.163-16 16v416c0 8.837 7.164 16 16 16h288zm-161.47-67.404l-25.93-7.527c-2.03-.59-3.677-2.784-3.677-4.898 0-.4.09-1.037.202-1.422l58.027-199.869c.59-2.03 2.784-3.678 4.898-3.678.4 0 1.038.09 1.422.202l25.928 7.527c2.03.59 3.677 2.784 3.677 4.898 0 .4-.09 1.037-.202 1.422l-58.026 199.87c-.59 2.03-2.784 3.677-4.898 3.677-.4 0-1.037-.09-1.422-.202zm-48.447-47.674c-.834.89-2.5 1.612-3.72 1.612-1.115 0-2.677-.618-3.49-1.38L57.611 308.72c-.89-.834-1.613-2.501-1.613-3.721 0-1.219.723-2.886 1.613-3.72l61.262-57.434c.813-.761 2.375-1.38 3.489-1.38 1.22 0 2.886.723 3.72 1.613l18.493 19.724c.761.812 1.38 2.375 1.38 3.488 0 1.273-.776 2.988-1.732 3.83L105.725 305l38.5 33.88c.954.842 1.73 2.557 1.73 3.83 0 1.113-.619 2.676-1.38 3.488zm139.043.232c-.812.762-2.375 1.38-3.488 1.38-1.22 0-2.887-.722-3.72-1.612l-18.493-19.724c-.762-.812-1.38-2.375-1.38-3.488 0-1.273.776-2.988 1.732-3.83L278.276 305l-38.5-33.88c-.954-.842-1.73-2.557-1.73-3.83 0-1.113.619-2.676 1.38-3.488l18.491-19.724c.834-.89 2.501-1.612 3.721-1.612 1.113 0 2.676.618 3.488 1.379l61.262 57.434c.89.834 1.612 2.501 1.612 3.72 0 1.22-.722 2.887-1.612 3.72z"/></svg></span> Libraries</a> <a class="toc-link" href="#papers-list"><span class=" icon-wrapper icon-fa icon-fa-light" data-name="file"><svg viewBox="0 0 384 520.146" xmlns="http://www.w3.org/2000/svg"><path d="M369.9 98.9c9 9 14.1 21.3 14.1 34V465c0 26.5-21.5 48-48 48H48c-26.5 0-48-21.5-48-48V49C0 22.5 21.5 1 48 .9h204.1C264.8.9 277 6 286 15zm-22.6 22.7l-83.899-83.9c-2.1-2.1-4.6-3.5-7.4-4.2V129h95.5c-.7-2.8-2.1-5.3-4.2-7.4zM336 481c8.8 0 16-7.2 16-16V161H248c-13.3 0-24-10.7-24-24V33H48c-8.8 0-16 7.2-16 16v416c0 8.8 7.2 16 16 16h288z"/></svg></span> Papers</a> <a data-call-url="/tasklist/video-generation/greatest" data-target="/task/video-generation" class="toc-papers-button" style="padding-left: 16px;" href="#papers-list">- Most implemented</a> <a data-call-url="/tasklist/video-generation/social" data-target="/task/video-generation/social" class="toc-papers-button" style="padding-left: 16px;" href="#papers-list">- Social</a> <a data-call-url="/tasklist/video-generation/latest" data-target="/task/video-generation/latest" class="toc-papers-button" style="padding-left: 16px;" href="#papers-list">- Latest</a> <a data-call-url="/tasklist/video-generation/codeless" data-target="/task/video-generation/codeless" class="toc-papers-button" style="padding-left: 16px;" href="#papers-list">- No code</a> </nav> </div> </div> </main> </div> <div class="footer"> <div class="footer-contact"> <span class="footer-contact-item">Contact us on:</span> <a class="footer-contact-item" href="mailto:hello@paperswithcode.com"> <span class=" icon-wrapper icon-ion" data-name="mail"><svg xmlns="http://www.w3.org/2000/svg" width="512" height="512" viewBox="0 0 512 512"><path d="M424 80H88a56.06 56.06 0 0 0-56 56v240a56.06 56.06 0 0 0 56 56h336a56.06 56.06 0 0 0 56-56V136a56.06 56.06 0 0 0-56-56zm-14.18 92.63l-144 112a16 16 0 0 1-19.64 0l-144-112a16 16 0 1 1 19.64-25.26L256 251.73l134.18-104.36a16 16 0 0 1 19.64 25.26z"/></svg></span> hello@paperswithcode.com </a>. <span class="footer-contact-item"> Papers With Code is a free resource with all data licensed under <a rel="noreferrer" href="https://creativecommons.org/licenses/by-sa/4.0/">CC-BY-SA</a>. </span> </div> <div class="footer-links"> <a href="/site/terms">Terms</a> <a href="/site/data-policy">Data policy</a> <a href="/site/cookies-policy">Cookies policy</a> <a href="/about#team" class="fair-logo"> from <img src="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAANAAAAAgCAMAAABU6AZfAAAABGdBTUEAALGPC/xhBQAAAAFzUkdCAK7OHOkAAAAJcEhZcwAAFiUAABYlAUlSJPAAAABFUExURUdwTBwqMhwqMxsqMhkqMxsqMhwqMgCA+hwrMxJIgBsrMxsqMgJ28AF58wF38BsqMwB58hsqMwF17wF07hwrMwRm4QJz7Wj6SIIAAAAUdFJOUwDP87wcPIT+4A1tVti1Ta0smZVzG3JP8wAABR9JREFUWMO1memWpCoMgF0QxX1//0e9kCAkAadq5tzKjzndQmM+szNFEWQ9puu6xn02BXm4j23bTsdapKJAMguFgRVT/Ejyx4uH5hgvL1PUfm69jEd6bN05GTJvXF5X/hfRcPyWe2kTLDFdRA4ENVMbZZJGMt3ppEttNMDC2X/Qa7MK1OrveZoKz2/445I+U4znuvaExxKZLFCqtym/A6rzn+OjbHj8ubwDmfESslvtgWea13WeckQPUKJTf/4USHkDnVXzCrT74DnmeX+8rjgcxA4QBmPpyAKdOm+5XwFpgHH/bG9AMzLMqM9DxxCQaM0qLr7U4xE/AgIDVRBHlcoDeYd7lFee6GZOBvaaskD8S6nut0Dg0ItZEt+IQAfjseIzRDvS/WCxWQJ17phqEGqepQBS/VaXZa0H/4XUYMVt6nr309DEjYvduPT2gWELQTr0iQbC1+SADOg/kjVvspGqX6zSRAgEKbqOf6zgd82AVB+8s0YNm5NL6Y8MGzttwKt0krP9+9A/+hzQTALoUX5MnxW7iCIEUmD7IVZb8G0G1HRE9UqbWKkEUFPSR0MWqH5eB65XmgzQdN3WGjxReROxPD2LROeBIEiD7UGLraBAjMcS9W9AquTPckBgoMqEWG1SIGN57otn5KO9Y30N4rq6MQFC5TX1cEWBfJLY+mbQ5ZMUm8UK7F1A9GNc90T3enkpCZhCdUzfdQq0Wp774gnZao55YU3SgkmAVBez1eDfR4BABd/XqY36ichyaLUnyJZ8jatimUBjqQTouK2M3OGs4miiiduN5bkHCL15C9Zw7heBRMHYSMRxIGyYFsPqpwTqactT8w0P0OSA9iRY9jQvrDyIAhCoAjrrR90I1PNCpcivHEh+cATUmS5xoCaNB3ggMzqgRO/RYPIb1WviDkB4sv22kB8ghQcgUIFWzyUmaQ6kpf5DCoTFh5fwQQCt493e9ypD5Xjq7S5cMQeEubpBf2oKCoSMohPzduBAi2yimhRIc3NvrOd+gCxPexvhcGPM3SRoJpbmIhAGSudTNgNCR+qIRL05UCebsxTIiAYOX6sEkONphRkw9A9ZjADIZIDg857we5MBSiQHVMlWJgXyeTBIyVpGD4RttHC4yVtENHn7K5ASdeM3QGX2sKcKBCBmITYmrGii9TOQT7JYwxOgrhbyby4XJrvs54kuR8vlCg4XEgEOEs8Q8R5DYZboCwEESpTmi/Hhc1Lo8zxPlghZjpbLqWVGUGxSes1y4W2lkkC+Wf0C6GPaxtZo0VQW4nOhsJLqAg01HXqgGN0+083MegKoYLdisbDqzHVG1iZJYe0EUDoB+dj149gDRCCgt2lZ1zA5nhvCyEwvrc/b3N/HiZlMgINmZaR/aX3MJluf7Kepo8+F5tRfUh1wR0odzg8Srnm9w7L5SyB/p6H9Ptt0Vj310ngAlDHbnLo3mGc00sJiQ+4KEM+I8xC7fWv5VGcz3Y0C2ZCa70sgf0tXbnbY1jXpln3W6jYXDG4jNthdrfVWn8n4gAVAZe+0GgaEaeGFx4XRQyTM9yWQnNuIAy5/HPAWPuDJ8Yc66sYvSeY/8dhlYqH0kuQzkFQ03nnHCyI/gtc0GfM7BVPmL5J0yHPkXm6d3u6v/TLw3GL5ayDr6WW47awHYmS1VC+XJOVQcCCZBPk13SCvgmcb8uI/UqjqdvlOlk3j5OU20C0putdO1ZWNo0a8oumXslx0vMYaNrfPURt2hnp5G2rhtsEP5j/3Wqt0fQd1YgAAAABJRU5ErkJggg=="> </a> </div> </div> <script> // MathJax window.MathJax = { tex: { inlineMath: [ ["$", "$"], ["\\(", "\\)"], ], }, }; const mathjaxScript = document.createElement("script"); mathjaxScript.src = "https://production-assets.paperswithcode.com/static/js/mathjax/tex-chtml.js"; document.head.appendChild(mathjaxScript); </script> <script src="https://production-assets.paperswithcode.com/perf/766.4af6b88b.js" defer></script><script src="https://production-assets.paperswithcode.com/perf/2.6da00df7.js" defer></script><script src="https://production-assets.paperswithcode.com/perf/351.a22a9607.js" defer></script><script src="https://production-assets.paperswithcode.com/perf/101.5f271f23.js" defer></script><script src="https://production-assets.paperswithcode.com/perf/view_task.e61ab167.js" defer></script> </body> </html>

Pages: 1 2 3 4 5 6 7 8 9 10