<!-- CINXE.COM
Free NLP Datasets for Machine Learning | DagsHub -->
<!doctype html>
<html lang="en-US">
<head>
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <link rel="profile" href="https://gmpg.org/xfn/11">
  <!--
    Sign-in bootstrap.
    Reads two cookies and, when either is missing, marks <body> with
    data-md-signed-in="false". The top-level const/let names are left in the
    global scope on purpose: later scripts on the page may read them
    (NOTE(review): confirm which of base_url / ajax_url / getCookie are used
    elsewhere before renaming anything).
  -->
  <script>
    // Constants
    const SIGN_IN_STATUS_ATTRIBUTE = 'data-md-signed-in',
      SIGNED_IN_STATUS = 'true',
      SIGNED_OUT_STATUS = 'false';
    const SIGN_IN_USERNAME_COOKIE = 'dags_awesome',
      SIGN_IN_USER_ID_COOKIE = 'ajs_user_id';
    const base_url = 'https://dagshub.com',
      ajax_url = 'https://dagshub.com/wp-admin/admin-ajax.php';

    // Returns the raw value of the cookie called `name`, or undefined when
    // no such cookie is present.
    const getCookie = (name) => {
      // Escape regex metacharacters so the name is always matched literally.
      const safeName = String(name).replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
      const match = document.cookie.match(new RegExp('(^| )' + safeName + '=([^;]+)'));
      if (match) return match[2];
    };

    // Presumably emitted per template by the server; false on this page.
    const is_home = false;

    // Handling Signed in status
    let username = getCookie(SIGN_IN_USERNAME_COOKIE);
    let user_id = getCookie(SIGN_IN_USER_ID_COOKIE);

    if (username && user_id) {
      // document.body.setAttribute(
      //   SIGN_IN_STATUS_ATTRIBUTE,
      //   SIGNED_IN_STATUS
      // );
      if (is_home) {
        location.replace(base_url + "/dashboard");
      }
      // $('.profile-menu .avatar').attr("src", "/avatars/" + user_id);
      // $('.profile-menu .name').text(username);
      // $('#user-profile-link').attr("href", "/" + username);
    } else {
      // This script runs inside <head>, where document.body is still null,
      // so touching it immediately would throw. Apply the attribute right
      // away if the body already exists, otherwise once the DOM is parsed.
      const markSignedOut = () => {
        document.body.setAttribute(
          SIGN_IN_STATUS_ATTRIBUTE,
          SIGNED_OUT_STATUS
        );
      };
      if (document.body) {
        markSignedOut();
      } else {
        document.addEventListener('DOMContentLoaded', markSignedOut, { once: true });
      }
    }
  </script>
  <meta name='robots' content='index, follow, max-image-preview:large, max-snippet:-1, max-video-preview:-1' />
  <!-- This site is optimized with the Yoast SEO plugin v23.4 - https://yoast.com/wordpress/plugins/seo/ -->
  <title>Free NLP Datasets for Machine Learning | DagsHub</title>
  <meta name="description" content="Save time searching for quality NLP training data. Here are free open NLP datasets to develop and train ML models." />
  <link rel="canonical" href="https://dagshub.com/datasets/nlp/" />
  <meta property="og:locale" content="en_US" />
  <meta property="og:type" content="article" />
  <meta property="og:title" content="Free NLP Datasets for Machine Learning | DagsHub" />
  <meta property="og:description" content="Save time searching for quality NLP training data. 
Here are free open NLP datasets to develop and train ML models." /> <meta property="og:url" content="https://dagshub.com/datasets/nlp/" /> <meta property="og:site_name" content="DagsHub" /> <meta property="og:image" content="https://dagshub.com/wp-content/uploads/2023/02/Datasets-OG-Image.jpg" /> <meta property="og:image:width" content="1200" /> <meta property="og:image:height" content="630" /> <meta property="og:image:type" content="image/jpeg" /> <meta name="twitter:card" content="summary_large_image" /> <meta name="twitter:image" content="https://dagshub.com/wp-content/uploads/2023/02/Datasets-OG-Image.jpg" /> <meta name="twitter:site" content="@TheRealDagsHub" /> <script type="application/ld+json" class="yoast-schema-graph">{"@context":"https://schema.org","@graph":[{"@type":"CollectionPage","@id":"https://dagshub.com/datasets/nlp/","url":"https://dagshub.com/datasets/nlp/","name":"Free NLP Datasets for Machine Learning | DagsHub","isPartOf":{"@id":"https://dagshub.com/#website"},"description":"Save time searching for quality NLP training data. 
Here are free open NLP datasets to develop and train ML models.","inLanguage":"en-US"},{"@type":"WebSite","@id":"https://dagshub.com/#website","url":"https://dagshub.com/","name":"DagsHub","description":"","publisher":{"@id":"https://dagshub.com/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https://dagshub.com/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https://dagshub.com/#organization","name":"DagsHub","url":"https://dagshub.com/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https://dagshub.com/#/schema/logo/image/","url":"https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg","contentUrl":"https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg","width":143,"height":40,"caption":"DagsHub"},"image":{"@id":"https://dagshub.com/#/schema/logo/image/"},"sameAs":["https://x.com/TheRealDagsHub","https://www.linkedin.com/company/dagshub"]}]}</script> <!-- / Yoast SEO plugin. --> <link rel='dns-prefetch' href='//dagshub.com' /> <link rel="alternate" type="application/rss+xml" title="DagsHub » Feed" href="https://dagshub.com/feed/" /> <link rel="alternate" type="application/rss+xml" title="DagsHub » Comments Feed" href="https://dagshub.com/comments/feed/" /> <link rel="alternate" type="application/rss+xml" title="DagsHub » NLP Dataset Category Feed" href="https://dagshub.com/datasets/nlp/feed/" /> <script> window._wpemojiSettings = {"baseUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/72x72\/","ext":".png","svgUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/svg\/","svgExt":".svg","source":{"concatemoji":"https:\/\/dagshub.com\/wp-includes\/js\/wp-emoji-release.min.js?ver=4e55ae54fa701286f578c2d0b9d76284"}}; /*! 
This file is auto-generated */ !function(i,n){var o,s,e;function c(e){try{var t={supportTests:e,timestamp:(new Date).valueOf()};sessionStorage.setItem(o,JSON.stringify(t))}catch(e){}}function p(e,t,n){e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(t,0,0);var t=new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data),r=(e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(n,0,0),new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data));return t.every(function(e,t){return e===r[t]})}function u(e,t,n){switch(t){case"flag":return n(e,"\ud83c\udff3\ufe0f\u200d\u26a7\ufe0f","\ud83c\udff3\ufe0f\u200b\u26a7\ufe0f")?!1:!n(e,"\ud83c\uddfa\ud83c\uddf3","\ud83c\uddfa\u200b\ud83c\uddf3")&&!n(e,"\ud83c\udff4\udb40\udc67\udb40\udc62\udb40\udc65\udb40\udc6e\udb40\udc67\udb40\udc7f","\ud83c\udff4\u200b\udb40\udc67\u200b\udb40\udc62\u200b\udb40\udc65\u200b\udb40\udc6e\u200b\udb40\udc67\u200b\udb40\udc7f");case"emoji":return!n(e,"\ud83d\udc26\u200d\u2b1b","\ud83d\udc26\u200b\u2b1b")}return!1}function f(e,t,n){var r="undefined"!=typeof WorkerGlobalScope&&self instanceof WorkerGlobalScope?new OffscreenCanvas(300,150):i.createElement("canvas"),a=r.getContext("2d",{willReadFrequently:!0}),o=(a.textBaseline="top",a.font="600 32px Arial",{});return e.forEach(function(e){o[e]=t(a,e,n)}),o}function t(e){var t=i.createElement("script");t.src=e,t.defer=!0,i.head.appendChild(t)}"undefined"!=typeof Promise&&(o="wpEmojiSettingsSupports",s=["flag","emoji"],n.supports={everything:!0,everythingExceptFlag:!0},e=new Promise(function(e){i.addEventListener("DOMContentLoaded",e,{once:!0})}),new Promise(function(t){var n=function(){try{var e=JSON.parse(sessionStorage.getItem(o));if("object"==typeof e&&"number"==typeof e.timestamp&&(new Date).valueOf()<e.timestamp+604800&&"object"==typeof e.supportTests)return e.supportTests}catch(e){}return null}();if(!n){if("undefined"!=typeof Worker&&"undefined"!=typeof OffscreenCanvas&&"undefined"!=typeof 
URL&&URL.createObjectURL&&"undefined"!=typeof Blob)try{var e="postMessage("+f.toString()+"("+[JSON.stringify(s),u.toString(),p.toString()].join(",")+"));",r=new Blob([e],{type:"text/javascript"}),a=new Worker(URL.createObjectURL(r),{name:"wpTestEmojiSupports"});return void(a.onmessage=function(e){c(n=e.data),a.terminate(),t(n)})}catch(e){}c(n=f(s,u,p))}t(n)}).then(function(e){for(var t in e)n.supports[t]=e[t],n.supports.everything=n.supports.everything&&n.supports[t],"flag"!==t&&(n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&n.supports[t]);n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&!n.supports.flag,n.DOMReady=!1,n.readyCallback=function(){n.DOMReady=!0}}).then(function(){return e}).then(function(){var e;n.supports.everything||(n.readyCallback(),(e=n.source||{}).concatemoji?t(e.concatemoji):e.wpemoji&&e.twemoji&&(t(e.twemoji),t(e.wpemoji)))}))}((window,document),window._wpemojiSettings); </script> <link rel='stylesheet' id='block-editor-styles-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/editor.css?ver=1732810781' type='text/css' media='all' /> <style id='wp-emoji-styles-inline-css' type='text/css'> img.wp-smiley, img.emoji { display: inline !important; border: none !important; box-shadow: none !important; height: 1em !important; width: 1em !important; margin: 0 0.07em !important; vertical-align: -0.1em !important; background: none !important; padding: 0 !important; } </style> <link rel='stylesheet' id='wp-block-library-css' href='https://dagshub.com/wp-includes/css/dist/block-library/style.min.css?ver=4e55ae54fa701286f578c2d0b9d76284' type='text/css' media='all' /> <style id='wp-block-library-theme-inline-css' type='text/css'> .wp-block-audio :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-audio :where(figcaption){color:#ffffffa6}.wp-block-audio{margin:0 0 1em}.wp-block-code{border:1px solid 
#ccc;border-radius:4px;font-family:Menlo,Consolas,monaco,monospace;padding:.8em 1em}.wp-block-embed :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-embed :where(figcaption){color:#ffffffa6}.wp-block-embed{margin:0 0 1em}.blocks-gallery-caption{color:#555;font-size:13px;text-align:center}.is-dark-theme .blocks-gallery-caption{color:#ffffffa6}:root :where(.wp-block-image figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme :root :where(.wp-block-image figcaption){color:#ffffffa6}.wp-block-image{margin:0 0 1em}.wp-block-pullquote{border-bottom:4px solid;border-top:4px solid;color:currentColor;margin-bottom:1.75em}.wp-block-pullquote cite,.wp-block-pullquote footer,.wp-block-pullquote__citation{color:currentColor;font-size:.8125em;font-style:normal;text-transform:uppercase}.wp-block-quote{border-left:.25em solid;margin:0 0 1.75em;padding-left:1em}.wp-block-quote cite,.wp-block-quote footer{color:currentColor;font-size:.8125em;font-style:normal;position:relative}.wp-block-quote.has-text-align-right{border-left:none;border-right:.25em solid;padding-left:0;padding-right:1em}.wp-block-quote.has-text-align-center{border:none;padding-left:0}.wp-block-quote.is-large,.wp-block-quote.is-style-large,.wp-block-quote.is-style-plain{border:none}.wp-block-search .wp-block-search__label{font-weight:700}.wp-block-search__button{border:1px solid #ccc;padding:.375em .625em}:where(.wp-block-group.has-background){padding:1.25em 2.375em}.wp-block-separator.has-css-opacity{opacity:.4}.wp-block-separator{border:none;border-bottom:2px solid;margin-left:auto;margin-right:auto}.wp-block-separator.has-alpha-channel-opacity{opacity:1}.wp-block-separator:not(.is-style-wide):not(.is-style-dots){width:100px}.wp-block-separator.has-background:not(.is-style-dots){border-bottom:none;height:1px}.wp-block-separator.has-background:not(.is-style-wide):not(.is-style-dots){height:2px}.wp-block-table{margin:0 0 1em}.wp-block-table td,.wp-block-table 
th{word-break:normal}.wp-block-table :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-table :where(figcaption){color:#ffffffa6}.wp-block-video :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-video :where(figcaption){color:#ffffffa6}.wp-block-video{margin:0 0 1em}:root :where(.wp-block-template-part.has-background){margin-bottom:0;margin-top:0;padding:1.25em 2.375em} </style> <style id='safe-svg-svg-icon-style-inline-css' type='text/css'> .safe-svg-cover{text-align:center}.safe-svg-cover .safe-svg-inside{display:inline-block;max-width:100%}.safe-svg-cover svg{height:100%;max-height:100%;max-width:100%;width:100%} </style> <style id='classic-theme-styles-inline-css' type='text/css'> /*! This file is auto-generated */ .wp-block-button__link{color:#fff;background-color:#32373c;border-radius:9999px;box-shadow:none;text-decoration:none;padding:calc(.667em + 2px) calc(1.333em + 2px);font-size:1.125em}.wp-block-file__button{background:#32373c;color:#fff;text-decoration:none} </style> <style id='global-styles-inline-css' type='text/css'> :root{--wp--preset--aspect-ratio--square: 1;--wp--preset--aspect-ratio--4-3: 4/3;--wp--preset--aspect-ratio--3-4: 3/4;--wp--preset--aspect-ratio--3-2: 3/2;--wp--preset--aspect-ratio--2-3: 2/3;--wp--preset--aspect-ratio--16-9: 16/9;--wp--preset--aspect-ratio--9-16: 9/16;--wp--preset--color--black: #000000;--wp--preset--color--cyan-bluish-gray: #abb8c3;--wp--preset--color--white: #ffffff;--wp--preset--color--pale-pink: #f78da7;--wp--preset--color--vivid-red: #cf2e2e;--wp--preset--color--luminous-vivid-orange: #ff6900;--wp--preset--color--luminous-vivid-amber: #fcb900;--wp--preset--color--light-green-cyan: #7bdcb5;--wp--preset--color--vivid-green-cyan: #00d084;--wp--preset--color--pale-cyan-blue: #8ed1fc;--wp--preset--color--vivid-cyan-blue: #0693e3;--wp--preset--color--vivid-purple: #9b51e0;--wp--preset--color--eeee-22: #eeee22;--wp--preset--color--81-d-742: 
#81d742;--wp--preset--color--1-e-73-be: #1e73be;--wp--preset--color--8224-e-3: #8224e3;--wp--preset--color--6-b-6-b-6-b: #6b6b6b;--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple: linear-gradient(135deg,rgba(6,147,227,1) 0%,rgb(155,81,224) 100%);--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan: linear-gradient(135deg,rgb(122,220,180) 0%,rgb(0,208,130) 100%);--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange: linear-gradient(135deg,rgba(252,185,0,1) 0%,rgba(255,105,0,1) 100%);--wp--preset--gradient--luminous-vivid-orange-to-vivid-red: linear-gradient(135deg,rgba(255,105,0,1) 0%,rgb(207,46,46) 100%);--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray: linear-gradient(135deg,rgb(238,238,238) 0%,rgb(169,184,195) 100%);--wp--preset--gradient--cool-to-warm-spectrum: linear-gradient(135deg,rgb(74,234,220) 0%,rgb(151,120,209) 20%,rgb(207,42,186) 40%,rgb(238,44,130) 60%,rgb(251,105,98) 80%,rgb(254,248,76) 100%);--wp--preset--gradient--blush-light-purple: linear-gradient(135deg,rgb(255,206,236) 0%,rgb(152,150,240) 100%);--wp--preset--gradient--blush-bordeaux: linear-gradient(135deg,rgb(254,205,165) 0%,rgb(254,45,45) 50%,rgb(107,0,62) 100%);--wp--preset--gradient--luminous-dusk: linear-gradient(135deg,rgb(255,203,112) 0%,rgb(199,81,192) 50%,rgb(65,88,208) 100%);--wp--preset--gradient--pale-ocean: linear-gradient(135deg,rgb(255,245,203) 0%,rgb(182,227,212) 50%,rgb(51,167,181) 100%);--wp--preset--gradient--electric-grass: linear-gradient(135deg,rgb(202,248,128) 0%,rgb(113,206,126) 100%);--wp--preset--gradient--midnight: linear-gradient(135deg,rgb(2,3,129) 0%,rgb(40,116,252) 100%);--wp--preset--font-size--small: 13px;--wp--preset--font-size--medium: 20px;--wp--preset--font-size--large: 36px;--wp--preset--font-size--x-large: 42px;--wp--preset--spacing--20: 0.44rem;--wp--preset--spacing--30: 0.67rem;--wp--preset--spacing--40: 1rem;--wp--preset--spacing--50: 1.5rem;--wp--preset--spacing--60: 2.25rem;--wp--preset--spacing--70: 
3.38rem;--wp--preset--spacing--80: 5.06rem;--wp--preset--shadow--natural: 6px 6px 9px rgba(0, 0, 0, 0.2);--wp--preset--shadow--deep: 12px 12px 50px rgba(0, 0, 0, 0.4);--wp--preset--shadow--sharp: 6px 6px 0px rgba(0, 0, 0, 0.2);--wp--preset--shadow--outlined: 6px 6px 0px -3px rgba(255, 255, 255, 1), 6px 6px rgba(0, 0, 0, 1);--wp--preset--shadow--crisp: 6px 6px 0px rgba(0, 0, 0, 1);}:where(.is-layout-flex){gap: 0.5em;}:where(.is-layout-grid){gap: 0.5em;}body .is-layout-flex{display: flex;}.is-layout-flex{flex-wrap: wrap;align-items: center;}.is-layout-flex > :is(*, div){margin: 0;}body .is-layout-grid{display: grid;}.is-layout-grid > :is(*, div){margin: 0;}:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;}:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}.has-black-color{color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-color{color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-color{color: var(--wp--preset--color--white) !important;}.has-pale-pink-color{color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-color{color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-color{color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-color{color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-color{color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-color{color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-color{color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-color{color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-color{color: var(--wp--preset--color--vivid-purple) !important;}.has-black-background-color{background-color: var(--wp--preset--color--black) 
!important;}.has-cyan-bluish-gray-background-color{background-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-background-color{background-color: var(--wp--preset--color--white) !important;}.has-pale-pink-background-color{background-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-background-color{background-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-background-color{background-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-background-color{background-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-background-color{background-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-background-color{background-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-background-color{background-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-background-color{background-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-background-color{background-color: var(--wp--preset--color--vivid-purple) !important;}.has-black-border-color{border-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-border-color{border-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-border-color{border-color: var(--wp--preset--color--white) !important;}.has-pale-pink-border-color{border-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-border-color{border-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-border-color{border-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-border-color{border-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-border-color{border-color: var(--wp--preset--color--light-green-cyan) 
!important;}.has-vivid-green-cyan-border-color{border-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-border-color{border-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-border-color{border-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-border-color{border-color: var(--wp--preset--color--vivid-purple) !important;}.has-vivid-cyan-blue-to-vivid-purple-gradient-background{background: var(--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple) !important;}.has-light-green-cyan-to-vivid-green-cyan-gradient-background{background: var(--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan) !important;}.has-luminous-vivid-amber-to-luminous-vivid-orange-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange) !important;}.has-luminous-vivid-orange-to-vivid-red-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-orange-to-vivid-red) !important;}.has-very-light-gray-to-cyan-bluish-gray-gradient-background{background: var(--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray) !important;}.has-cool-to-warm-spectrum-gradient-background{background: var(--wp--preset--gradient--cool-to-warm-spectrum) !important;}.has-blush-light-purple-gradient-background{background: var(--wp--preset--gradient--blush-light-purple) !important;}.has-blush-bordeaux-gradient-background{background: var(--wp--preset--gradient--blush-bordeaux) !important;}.has-luminous-dusk-gradient-background{background: var(--wp--preset--gradient--luminous-dusk) !important;}.has-pale-ocean-gradient-background{background: var(--wp--preset--gradient--pale-ocean) !important;}.has-electric-grass-gradient-background{background: var(--wp--preset--gradient--electric-grass) !important;}.has-midnight-gradient-background{background: var(--wp--preset--gradient--midnight) !important;}.has-small-font-size{font-size: var(--wp--preset--font-size--small) 
!important;}.has-medium-font-size{font-size: var(--wp--preset--font-size--medium) !important;}.has-large-font-size{font-size: var(--wp--preset--font-size--large) !important;}.has-x-large-font-size{font-size: var(--wp--preset--font-size--x-large) !important;} :where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;} :where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;} :root :where(.wp-block-pullquote){font-size: 1.5em;line-height: 1.6;} </style> <link rel='stylesheet' id='contact-form-7-css' href='https://dagshub.com/wp-content/plugins/contact-form-7/includes/css/styles.css?ver=5.9.8' type='text/css' media='all' /> <link rel='stylesheet' id='styles-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/main.css?ver=1732811207' type='text/css' media='all' /> <link rel='stylesheet' id='new-style-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/new-style.css?ver=1732811209' type='text/css' media='all' /> <link rel='stylesheet' id='main-theme-style-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/style.css?ver=1724943191' type='text/css' media='all' /> <link rel='stylesheet' id='fancybox-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/vendors/fancybox/fancybox.css?ver=4.0.31' type='text/css' media='all' /> <link rel="https://api.w.org/" href="https://dagshub.com/wp-json/" /><link rel="alternate" title="JSON" type="application/json" href="https://dagshub.com/wp-json/wp/v2/dataset_category/7" /><link rel="EditURI" type="application/rsd+xml" title="RSD" href="https://dagshub.com/xmlrpc.php?rsd" /> <!-- Google Tag Manager --> <script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start': new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0], j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src= 
'https://www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f); })(window,document,'script','dataLayer','GTM-PGHTMDN');</script> <!-- End Google Tag Manager --> <link rel="icon" href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-32x32.png" sizes="32x32" /> <link rel="icon" href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-192x192.png" sizes="192x192" /> <link rel="apple-touch-icon" href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-180x180.png" /> <meta name="msapplication-TileImage" content="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-270x270.png" /> <style id="wp-custom-css"> .c-glossary__thumb{ top:0px; left:0px; } .header__actions .c-buttons { margin-top: 0; } .grecaptcha-badge{ visibility: hidden; } .home .site-head{ background-color:rgba(0,0,0,.0); } body:not(.home){ margin-top:68px; } body .site .main { padding-top: 0; } body:not(.home) .site { padding-top: 0px; } .home .site-head.site-head__scrolled{ background-color:#090819; } .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-height:66px; max-width:155px; object-fit: contain; } #wpcf7-f2379-p2377-o1 .c-form-primary__field:has(.wpcf7-not-valid) .wpcf7-not-valid-tip { display: block; } @media only screen and (max-width: 1280px) { .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-width:120px; max-height:55px; } } @media only screen and (max-width: 1199px) { .head-nav a:not(.btn) { display: block; } .head-nav a:not(.btn) .menu-item__text{ display:block; } .head-nav .sub-menu a:not(.btn) .menu-item__text{ display:inline-flex; } } @media only screen and (max-width: 1026px) { .canvas-animation--bg, .canvas-animation--bg canvas{ pointer-events:none; } .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-width:90px; max-height:40px; } .home-hero-block .title__gradient div { -webkit-text-fill-color: #0000; background: 
linear-gradient(180deg, #fff 17.78%, #ffffff1a 191.11%);
      background-clip: text;
      -webkit-background-clip: text;
      pointer-events: none;
    }
  }
  @media only screen and (min-width: 1441px) {
    .site-head__nav {
      /* declared once; the original repeated this same declaration twice */
      margin-right: auto;
    }
  }
</style>
</head>
<body class="archive tax-dataset_category term-nlp term-7 wp-custom-logo no-js">
<!-- NOTE(review): the skip link targets #content; no element with that id is visible in this part of the page, confirm it exists further down. -->
<a class="skip-link screen-reader-text js-trigger" href="#content">Skip to content</a>
<!-- Google Tag Manager (noscript) -->
<noscript><iframe src="https://www.googletagmanager.com/ns.html?id=GTM-PGHTMDN" height="0" width="0" style="display:none;visibility:hidden"></iframe></noscript>
<!-- End Google Tag Manager (noscript) -->
<div id="page" class="site">
  <!-- Site header: logo, mobile menu opener, primary navigation and account tools. -->
  <header class="site-head site-head__bacground" role="banner" itemscope="itemscope" itemtype="http://schema.org/WPHeader">
    <div class="site-head__wrap">
      <div class="container container-lg">
        <div class="site-head__frame">
          <!-- Custom logo and site title. -->
          <div class="site-logo">
            <a href="https://dagshub.com/" class="custom-logo-link" rel="home"><img width="143" height="40" src="https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg" class="custom-logo" alt="DagsHub" decoding="async" /></a>
            <span class="screen-reader-text" itemprop="name">DagsHub</span>
          </div>
          <!-- Explicit type so the opener can never act as a submit button if it ends up inside a form. -->
          <button class="nav-opener" type="button" aria-label="nav opener"><span><em>Menu</em></span></button>
          <div class="site-head__holder">
            <!-- Main menu. 
-->
            <!-- Primary navigation. Icons inside the dropdown toggles are decorative (the button already carries the text "Expand child menu"), so they are hidden from assistive technology. -->
            <nav class="site-head__nav js-header-menu-item" role="navigation" itemscope="itemscope" itemtype="http://schema.org/SiteNavigationElement">
              <ul class="menu head-nav main-header-menu"><li id="menu-item-2351" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2351">
                  <div class="menu-item__link menu-item__link--title">Resources</div>
                  <!-- aria-expanded is presumably toggled by the theme script when the submenu opens; confirm. -->
                  <button class="dropdown-toggle" type="button" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
                  <ul class="sub-menu level0">
                    <li id="menu-item-2357" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2357">
                      <a href="https://dagshub.com/blog/" class="menu-item__link"><span class="menu-item__text">Blog</span></a>
                    </li>
                    <li id="menu-item-2358" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2358">
                      <a href="https://dagshub.com/datasets/" class="menu-item__link"><span class="menu-item__text">Datasets</span></a>
                    </li>
                    <li id="menu-item-2359" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2359">
                      <a href="https://dagshub.com/glossary/" class="menu-item__link"><span class="menu-item__text">Glossary</span></a>
                    </li>
                    <li id="menu-item-2360" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2360">
                      <a href="https://dagshub.com/blog/tag/tutorials/" class="menu-item__link"><span class="menu-item__text">Tutorial &amp; Webinars</span></a>
                    </li>
                  </ul>
                </li>
                <li id="menu-item-2352" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2352">
                  <a href="https://dagshub.com/docs" class="menu-item__link"><span class="menu-item__text">Docs</span></a>
                </li>
                <li id="menu-item-2353" class="menu-item menu-item-type-custom menu-item-object-custom 
menu-item-has-children menu-item-2353">
                  <!-- "Product" dropdown. Each entry pairs a sprite icon with a title and a one-line description; the icons add no information beyond that text, so they are marked aria-hidden. -->
                  <div class="menu-item__link menu-item__link--title">Product</div>
                  <button class="dropdown-toggle" type="button" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
                  <ul class="sub-menu level0">
                    <li id="menu-item-2361" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2361">
                      <a href="https://dagshub.com/data-engine/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-data-engine" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-data-engine"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Data engine</span><span class="menu-description">Manage your unstructured data</span></span></span></a>
                    </li>
                    <li id="menu-item-2362" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2362">
                      <a href="https://dagshub.com/use-cases/llm/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-llms" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-llms"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">LLMs</span><span class="menu-description">Build LLM projects quickly</span></span></span></a>
                    </li>
                    <li id="menu-item-2363" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2363">
                      <a href="https://dagshub.com/product/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-linear-search" width="20" height="20" aria-hidden="true"><use 
xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-linear-search"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Overview</span><span class="menu-description">Organize your entire project under one roof</span></span></span></a>
                    </li>
                    <li id="menu-item-2364" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2364">
                      <!-- Sprite icon is decorative: the entry is fully described by its title and description text. -->
                      <a href="https://dagshub.com/enterprise/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-enterprise" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-enterprise"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Enterprise</span><span class="menu-description">A single source of truth for your organization</span></span></span></a>
                    </li>
                  </ul>
                </li>
                <li id="menu-item-2354" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2354">
                  <a href="/enterprise/" class="menu-item__link"><span class="menu-item__text">Enterprise</span></a>
                </li>
                <li id="menu-item-2355" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2355">
                  <a href="https://dagshub.com/pricing" class="menu-item__link"><span class="menu-item__text">Pricing</span></a>
                </li>
                <li id="menu-item-2356" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2356">
                  <!-- "Company" dropdown; the toggle's visible name comes from the "Expand child menu" text, the chevron is decorative. -->
                  <div class="menu-item__link menu-item__link--title">Company</div>
                  <button class="dropdown-toggle" type="button" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
                  <ul class="sub-menu level0">
                    <li id="menu-item-2365" class="menu-item menu-item-type-custom 
menu-item-object-custom menu-item-2365">
      <a href="https://dagshub.com/about" class="menu-item__link"><span class="menu-item__text">About</span></a>
    </li>
    <li id="menu-item-2366" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2366">
      <a href="https://dagshub.com/careers" class="menu-item__link"><span class="menu-item__text">Careers</span></a>
    </li>
    <li id="menu-item-2367" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2367">
      <a href="https://dagshub.com/contact-us/" class="menu-item__link"><span class="menu-item__text">Contact us</span></a>
    </li>
  </ul>
</li>
</ul>
</nav>
<!-- Header actions: log-in link and demo call-to-action. NOTE(review): the rel values look like analytics event names rather than link types; confirm what reads them before changing. -->
<div class="site-head__tools">
  <ul class="menu head-nav main-header-menu"><li id="menu-item-2372" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2372"><a rel="Navbar_Login_Clicked" href="https://dagshub.com/user/login" class="menu-item__link">Log in</a></li>
    <li id="menu-item-2389" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2389"><a rel="Navbar_BookADemo_Clicked" href="https://dagshub.com/book-a-demo/" class="menu-item__button btn btn--primary"><span class="btn__text">Book a demo</span></a></li>
  </ul>
</div>
</div>
</div>
</div>
</div>
</header>
<div class="wrapper__body no-overlap">
  <main class="main">
    <!-- NLP dataset listing: head (back link, title, search) followed by the dataset cards. -->
    <section class="c-block b-block-common b-block-nlp">
      <div class="container b-block-common__container">
        <div class="b-block-common__head">
          <div class="b-block-common__head-actions">
            <a href="https://dagshub.com/datasets/" class="c-btn c-btn-light c-btn-icon-left"><svg height="800px" width="800px" version="1.1" id="Layer_1" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" viewBox="0 0 495 495" xml:space="preserve"><g><polygon style="fill: currentColor;" points="247.5,334.58 291.894,379.119 320.224,350.881 247.5,277.92 217.179,247.5 247.5,217.08 320.224,144.119 291.894,115.881 247.5,160.419 160.703,247.5"/></g></svg> Explore other datasets</a>
          </div>
          <div
class="b-block-common__head-title">
  <div class="b-block-common__head-title_icon">
    <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/NLP-1.svg" class="" alt="" decoding="async">
  </div>
  <h1 class="c-title b-block-common__title default">
    <span style="font-weight: 400;"> NLP Datasets</span><br>
  </h1>
</div>
<div class="c-text b-block-common__text c-text--list-style-">
  <p>Natural language processing (NLP) is transforming the way we interact with technology. With the ability to understand and generate human language, NLP is making it possible for computers to understand our thoughts and emotions. Whether it’s voice assistants, chatbots, or text-based communication, NLP is revolutionizing the way we communicate with machines. Join the NLP revolution and experience the power of human language technology.</p>
</div>
<div class="c-dataset-search " data-per-page="20">
  <div class="c-dataset-search__head">
    <h5 class="c-dataset-search__label c-dataset-search__label--title">Search datasets: </h5>
  </div>
  <div class="c-dataset-search__body">
    <div class="c-dataset-search__field">
      <!-- A placeholder is not a label, so the search input is named explicitly for assistive tech. -->
      <input type="search" placeholder="Enter dataset name" class="c-dataset-search__field-input" aria-label="Search datasets">
      <div class="c-dataset-search__field-icon">
        <i class="c-dataset-search__field-icon-open">
          <svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M7.33317 2.33341C4.57175 2.33341 2.33317 4.57199 2.33317 7.33342C2.33317 10.0948 4.57175 12.3334 7.33317 12.3334C10.0946 12.3334 12.3332 10.0948 12.3332 7.33342C12.3332 4.57199 10.0946 2.33341 7.33317 2.33341ZM0.666504 7.33342C0.666504 3.65152 3.65127 0.666748 7.33317 0.666748C11.0151 0.666748 13.9998 3.65152 13.9998 7.33342C13.9998 8.87401 13.4773 10.2925 12.5997 11.4215L17.0891 15.9108C17.4145 16.2363 17.4145 16.7639 17.0891 17.0893C16.7637 17.4148 16.236 17.4148 15.9106 17.0893L11.4212 12.6C10.2923 13.4775 8.87376 14.0001 7.33317 14.0001C3.65127 14.0001 0.666504 11.0153 0.666504 7.33342Z" fill="currentColor" /></svg>
        </i>
        <i class="c-dataset-search__field-icon-close">
          <svg width="12" height="12" viewBox="0 0 12 12" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M0.410582 0.410826C0.736019 0.0853888 1.26366 0.0853888 1.58909 0.410826L5.99984 4.82157L10.4106 0.410826C10.736 0.0853893 11.2637 0.0853893 11.5891 0.410826C11.9145 0.736263 11.9145 1.2639 11.5891 1.58934L7.17835 6.00008L11.5891 10.4108C11.9145 10.7363 11.9145 11.2639 11.5891 11.5893C11.2637 11.9148 10.736 11.9148 10.4106 11.5893L5.99984 7.17859L1.58909 11.5893C1.26366 11.9148 0.736019 11.9148 0.410582 11.5893C0.0851447 11.2639 0.0851447 10.7363 0.410582 10.4108L4.82133 6.00008L0.410582 1.58934C0.0851447 1.2639 0.0851447 0.736263 0.410582 0.410826Z" fill="currentColor"/></svg>
        </i>
      </div>
    </div>
    <div class="c-dataset-search__dd">
      <div class="c-dataset-search__filter">
        <h5 class="c-dataset-search__label c-dataset-search__label--filter">Filter results: </h5>
        <!-- Category filter buttons: explicit type="button" so they can never act as submit buttons; the check-mark SVG is decorative. -->
        <ul class="c-dataset-search__list">
          <li class="c-dataset-search__list-item">
            <button type="button" class="c-dataset-search__button" data-term-id="6">
              <div class="c-dataset-search__button-icon">
                <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
                <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/computer-vision-2.svg" class="" alt="" decoding="async">
              </div>
              <div class="c-dataset-search__button-label">Computer Vision</div>
            </button>
          </li>
          <li class="c-dataset-search__list-item">
<!-- Category filter buttons: explicit type="button" so they can never act as submit buttons; the check-mark SVGs are decorative and hidden from assistive tech. -->
<button type="button" class="c-dataset-search__button c-dataset-search__button--active" data-term-id="7">
  <div class="c-dataset-search__button-icon">
    <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
    <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/NLP-1.svg" class="" alt="" decoding="async">
  </div>
  <div class="c-dataset-search__button-label">NLP</div>
</button>
</li>
<li class="c-dataset-search__list-item">
  <button type="button" class="c-dataset-search__button" data-term-id="9">
    <div class="c-dataset-search__button-icon">
      <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
      <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/tabular.svg" class="" alt="" decoding="async">
    </div>
    <div class="c-dataset-search__button-label">Tabular</div>
  </button>
</li>
<li class="c-dataset-search__list-item">
  <button type="button" class="c-dataset-search__button" data-term-id="333">
    <div class="c-dataset-search__button-icon">
      <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
      <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/urban.svg" class="" alt="" decoding="async">
    </div>
    <div class="c-dataset-search__button-label">Urban</div>
  </button>
</li>
<li class="c-dataset-search__list-item">
  <button type="button" class="c-dataset-search__button" data-term-id="39">
    <div class="c-dataset-search__button-icon">
      <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
      <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/biology.svg" class="" alt="" decoding="async">
    </div>
    <div class="c-dataset-search__button-label">Biology</div>
  </button>
</li>
<li class="c-dataset-search__list-item">
  <button type="button" class="c-dataset-search__button" data-term-id="14">
    <div class="c-dataset-search__button-icon">
      <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951
0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
      <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/geology.svg" class="" alt="" decoding="async">
    </div>
    <div class="c-dataset-search__button-label">Geology</div>
  </button>
</li>
<li class="c-dataset-search__list-item">
  <!-- Explicit type="button" so the filter can never act as a submit button; its check-mark SVG is decorative. -->
  <button type="button" class="c-dataset-search__button" data-term-id="294">
    <div class="c-dataset-search__button-icon">
      <svg width="12" height="8" viewBox="0 0 12 8" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true"><path fill-rule="evenodd" clip-rule="evenodd" d="M11.1379 0.195262C11.3983 0.455612 11.3983 0.877722 11.1379 1.13807L4.47124 7.80474C4.21089 8.06509 3.78878 8.06509 3.52843 7.80474L0.861766 5.13807C0.601417 4.87772 0.601417 4.45561 0.861766 4.19526C1.12212 3.93491 1.54423 3.93491 1.80458 4.19526L3.99984 6.39052L10.1951 0.195262C10.4554 -0.0650874 10.8776 -0.0650874 11.1379 0.195262Z" fill="currentColor"/></svg>
      <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/audio.svg" class="" alt="" decoding="async">
    </div>
    <div class="c-dataset-search__button-label">Audio</div>
  </button>
</li>
</ul>
</div>
<div class="c-dataset-search__results"></div>
</div>
</div>
</div>
</div>
<div class="b-block-common__posts">
  <div class="c-posts">
    <!-- Dataset cards: the card link has no text content, so aria-label carries the dataset title as its accessible name. -->
    <article class="c-post-item c-post-item--id-1357 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
      <a class="c-post-item__link" data-analytics-event="" data-repo-id="344" href="https://dagshub.com/datasets/automatic-speech-recognition-asr-error-robustness/" aria-label="Automatic Speech Recognition (ASR) Error Robustness"></a>
      <div class="c-post-item__body">
        <h2 class="c-post-item__title"> Automatic Speech Recognition (ASR) Error Robustness </h2>
      </div>
    </article>
    <article class="c-post-item c-post-item--id-1345 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2
0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <!-- The card link has no text content, so aria-label carries the dataset title as its accessible name (same for every card below). -->
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="332" href="https://dagshub.com/datasets/helpful-sentences-from-reviews/" aria-label="Helpful Sentences from Reviews"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Helpful Sentences from Reviews </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1340 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="327" href="https://dagshub.com/datasets/learning-to-rank-and-filter-community-question-answering/" aria-label="Learning to Rank and Filter – community question answering"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Learning to Rank and Filter – community question answering </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1326 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="313" href="https://dagshub.com/datasets/ai2-tabmcq-multiple-choice-questions-aligned-with-the-aristo-tablestore/" aria-label="AI2 TabMCQ: Multiple Choice Questions aligned with the Aristo Tablestore"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> AI2 TabMCQ: Multiple Choice Questions aligned with the Aristo Tablestore </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1316 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="303" href="https://dagshub.com/datasets/the-klarna-product-page-dataset/" aria-label="The Klarna Product-Page Dataset"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> The Klarna Product-Page Dataset </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1296 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="283" href="https://dagshub.com/datasets/multiconer-dataset/" aria-label="MultiCoNER Dataset"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> MultiCoNER Dataset </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1288 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="275" href="https://dagshub.com/datasets/low-context-name-entity-recognition-ner-datasets-with-gazetteer/" aria-label="Low Context Name Entity Recognition (NER) Datasets with Gazetteer"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Low Context Name Entity Recognition (NER) Datasets with Gazetteer </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1280 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="267" href="https://dagshub.com/datasets/wikisum-coherent-summarization-dataset-for-efficient-human-evaluation/" aria-label="WikiSum: Coherent Summarization Dataset for Efficient Human-Evaluation"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> WikiSum: Coherent Summarization Dataset for Efficient Human-Evaluation </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1276 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="263" href="https://dagshub.com/datasets/common-screens/" aria-label="Common Screens"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Common Screens </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1257 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="244" href="https://dagshub.com/datasets/redasa-covid-19-open-data/" aria-label="REDASA COVID-19 Open Data"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> REDASA COVID-19 Open Data </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1254 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="241" href="https://dagshub.com/datasets/sudachi-language-resources/" aria-label="Sudachi Language Resources"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Sudachi Language Resources </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1256 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="243" href="https://dagshub.com/datasets/japanese-tokenizer-dictionaries/" aria-label="Japanese Tokenizer Dictionaries"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Japanese Tokenizer Dictionaries </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1265 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="252" href="https://dagshub.com/datasets/answer-reformulation/" aria-label="Answer Reformulation"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Answer Reformulation </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1252
c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <!-- The card link has no text content, so aria-label carries the dataset title as its accessible name (same for every card below). -->
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="239" href="https://dagshub.com/datasets/common-crawl/" aria-label="Common Crawl"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Common Crawl </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1241 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="228" href="https://dagshub.com/datasets/nlp-fast-ai-datasets/" aria-label="NLP – fast.ai datasets"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> NLP – fast.ai datasets </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1237 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="224" href="https://dagshub.com/datasets/dialoglue-a-natural-language-understanding-benchmark-for-task-oriented-dialogue/" aria-label="DialoGLUE: A Natural Language Understanding Benchmark for Task-Oriented Dialogue"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> DialoGLUE: A Natural Language Understanding Benchmark for Task-Oriented Dialogue </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1231 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="218" href="https://dagshub.com/datasets/voiser/" aria-label="VoiSeR"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> VoiSeR </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1219 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="206" href="https://dagshub.com/datasets/openalex-dataset/" aria-label="OpenAlex dataset"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> OpenAlex dataset </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1196 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="183" href="https://dagshub.com/datasets/zest-zeroshot-learning-from-task-descriptions/" aria-label="ZEST: ZEroShot learning from Task descriptions"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> ZEST: ZEroShot learning from Task descriptions </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1180 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="167" href="https://dagshub.com/datasets/pre-and-post-purchase-product-questions/" aria-label="Pre- and post-purchase product questions"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Pre- and post-purchase product questions </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1176 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="163" href="https://dagshub.com/datasets/amazon-pqa/" aria-label="Amazon-PQA"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Amazon-PQA </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1162 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="149" href="https://dagshub.com/datasets/cms-2008-2010-data-entrepreneurs-synthetic-public-use-file-de-synpuf-in-omop-common-data-model/" aria-label="CMS 2008-2010 Data Entrepreneurs’ Synthetic Public Use File (DE-SynPUF) in OMOP Common Data Model"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> CMS 2008-2010 Data Entrepreneurs’ Synthetic Public Use File (DE-SynPUF) in OMOP Common Data Model </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1161 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="148" href="https://dagshub.com/datasets/ai2-diagram-dataset-ai2d/" aria-label="AI2 Diagram Dataset (AI2D)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> AI2 Diagram Dataset (AI2D) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1151 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="138" href="https://dagshub.com/datasets/textbook-question-answering-tqa/" aria-label="Textbook Question Answering (TQA)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Textbook Question Answering (TQA) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1146 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="133" href="https://dagshub.com/datasets/synthea-synthetic-patient-generator-data-in-omop-common-data-model/" aria-label="Synthea synthetic patient generator data in OMOP Common Data Model"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Synthea synthetic patient generator data in OMOP
Common Data Model </h2>
  </div>
</article>
<!-- The card link has no text content, so aria-label carries the dataset title as its accessible name (same for every card below). -->
<article class="c-post-item c-post-item--id-1140 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="127" href="https://dagshub.com/datasets/ai2-tablestore-november-2015-snapshot/" aria-label="AI2 Tablestore (November 2015 Snapshot)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> AI2 Tablestore (November 2015 Snapshot) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1136 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="123" href="https://dagshub.com/datasets/humor-detection-from-product-question-answering-systems/" aria-label="Humor Detection from Product Question Answering Systems"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Humor Detection from Product Question Answering Systems </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1128 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="115" href="https://dagshub.com/datasets/aristo-tuple-kb/" aria-label="Aristo Tuple KB"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Aristo Tuple KB </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1116 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="103" href="https://dagshub.com/datasets/humor-patterns-used-for-querying-alexa-traffic/" aria-label="Humor patterns used for querying Alexa traffic"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Humor patterns used for querying Alexa traffic </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1113 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="100" href="https://dagshub.com/datasets/discrete-reasoning-over-the-content-of-paragraphs-drop/" aria-label="Discrete Reasoning Over the content of Paragraphs (DROP)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Discrete Reasoning Over the content of Paragraphs (DROP) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1094 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="81" href="https://dagshub.com/datasets/the-massively-multilingual-image-dataset-mmid/" aria-label="The Massively Multilingual Image Dataset (MMID)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> The Massively Multilingual Image Dataset (MMID) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1096 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="83" href="https://dagshub.com/datasets/wizard-of-tasks/" aria-label="Wizard of Tasks"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Wizard of Tasks </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1088 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="75" href="https://dagshub.com/datasets/reasoning-over-paragraph-effects-in-situations-ropes/" aria-label="Reasoning Over Paragraph Effects in Situations (ROPES)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Reasoning Over Paragraph Effects in Situations (ROPES) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1086 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="73" href="https://dagshub.com/datasets/quoref/" aria-label="Quoref"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Quoref </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1074 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="61" href="https://dagshub.com/datasets/provision-of-web-scale-parallel-corpora-for-official-european-languages-paracrawl/" aria-label="Provision of Web-Scale Parallel Corpora for Official European Languages (ParaCrawl)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Provision of Web-Scale Parallel Corpora for Official European Languages (ParaCrawl) </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1065 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="52" href="https://dagshub.com/datasets/enriched-topical-chat-dataset-for-knowledge-grounded-dialogue-systems/" aria-label="Enriched Topical-Chat Dataset for Knowledge-Grounded Dialogue Systems"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Enriched Topical-Chat Dataset for Knowledge-Grounded Dialogue Systems </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1055 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg,
#FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="42" href="https://dagshub.com/datasets/national-archives-catalog/" aria-label="National Archives Catalog"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> National Archives Catalog </h2>
  </div>
</article>
<!-- Dataset cards. Each card's link element has no text content, so aria-label repeats the card title to give the link an accessible name. -->
<article class="c-post-item c-post-item--id-1049 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="36" href="https://dagshub.com/datasets/google-books-ngrams/" aria-label="Google Books Ngrams"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Google Books Ngrams </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1044 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="31" href="https://dagshub.com/datasets/pass-perturb-and-select-summarizer-for-product-reviews/" aria-label="PASS: Perturb-and-Select Summarizer for Product Reviews"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> PASS: Perturb-and-Select Summarizer for Product Reviews </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1037 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="24" href="https://dagshub.com/datasets/multilingual-name-entity-recognition-ner-datasets-with-gazetteer/" aria-label="Multilingual Name Entity Recognition (NER) Datasets with Gazetteer"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Multilingual Name Entity Recognition (NER) Datasets with Gazetteer </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1034 c-post-item--type-datasets c-posts__item"
style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="21" href="https://dagshub.com/datasets/phrase-clustering-dataset-pcd/" aria-label="Phrase Clustering Dataset (PCD)"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Phrase Clustering Dataset (PCD) </h2>
  </div>
</article>
<!-- Dataset cards. Each card's link element has no text content, so aria-label repeats the card title to give the link an accessible name. -->
<article class="c-post-item c-post-item--id-1018 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="5" href="https://dagshub.com/datasets/the-multilingual-amazon-reviews-corpus/" aria-label="The Multilingual Amazon Reviews Corpus"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> The Multilingual Amazon Reviews Corpus </h2>
  </div>
</article>
<article class="c-post-item c-post-item--id-1019 c-post-item--type-datasets c-posts__item" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);">
  <a class="c-post-item__link" data-analytics-event="" data-repo-id="6" href="https://dagshub.com/datasets/software-heritage-graph-dataset/" aria-label="Software Heritage Graph Dataset"></a>
  <div class="c-post-item__body">
    <h2 class="c-post-item__title"> Software Heritage Graph Dataset </h2>
  </div>
</article>
</div> </div> </div> </section>
<!-- Call-to-action section: a solid background colour layer plus a Lottie animation layer, followed by the CTA content. -->
<section id="b-oob-cta-428779" class="c-block b-block b-oob-cta b-oob b-oob-cta--layout-default c-block--padding-default b-oob--style-boxed-container b-oob--style-small-padding-bottom b-oob--style-small-padding-top ">
  <div class="c-background ">
    <div class="c-background__color" style="background-color: #ededed"></div>
    <div class="c-background__media">
      <div class=" c-media " >
        <div class="c-media__element c-media__element--type-lottie c-media__element--all" style="top:0;bottom:0;">
          <dotlottie-player class="c-lottie " data-offset="500" autoplay
data-src="https://dagshub.com/wp-content/uploads/2023/01/20230130-130007lf30_editor_pxhmkthw.lottie" loop data-replay="true" ></dotlottie-player> </div> </div> </div>
<!-- CTA content: heading, sub-heading and a single "Book A Demo" action. -->
<div class="container c-block__content">
  <div class="b-oob-cta b-oob-inner">
    <div class="c-cta c-cta--id-85 c-cta--style-default">
      <div class="c-cta__inner">
        <div class="c-cta__col c-cta__col--body">
          <div class="c-section-header c-section-header--align-default ">
            <h2 class="c-title c-section-header__title default" style="color: #f4f4f4 !important" > Improve your data quality for better AI<br /> </h2>
            <!-- NOTE(review): heading level jumps from h2 to h4 here; left as-is because stylesheet selectors are not visible from this file. -->
            <h4 class="c-title c-section-header__subtitle default" style="color: #f4f4f4 !important" > Easily curate and annotate your vision, audio, and document data with a single platform<br /> </h4>
          </div>
        </div>
        <div class="c-cta__col c-cta__col--action">
          <div class="c-buttons-or-form ">
            <ul class="c-buttons ">
              <li class="c-button testimonials-section__bottom-action c-button--type-link c-button__style--primary-outline-white-bg">
                <!-- Opens in a new tab, so rel="noopener" is stated explicitly. -->
                <a data-analytics-event="DataSet Page SignUp CTA Clicked" class="c-btn c-btn-primary-outline-white-bg" href="https://dagshub.com/book-a-demo/" target="_blank" rel="noopener" title="Book A Demo"> Book A Demo </a>
              </li>
            </ul>
          </div> </div> </div> </div> </div> </div> </div></section>
<!-- "More categories" tiles. Each tile's link element is empty; aria-label names it instead of relying on title alone. -->
<div class="c-posts-alt c-posts-alt--items-4" data-count="4" data-total="8">
  <div class="container">
    <div class="c-posts-alt__head">
      <h2 class="c-title">More categories</h2>
    </div>
    <div class="c-posts-alt__body">
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked" href="https://dagshub.com/datasets/audio/" title="Audio" class="c-post-item__link" aria-label="Audio"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/audio.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3 class="c-post-item__title">Audio</h3>
      </div>
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked"
href="https://dagshub.com/datasets/biology/" title="Biology" class="c-post-item__link" aria-label="Biology"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/biology.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3 class="c-post-item__title">Biology</h3>
      </div>
      <!-- Category tiles. Each tile's link element is empty; aria-label names it instead of relying on title alone. The icons are decorative (empty alt). -->
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked" href="https://dagshub.com/datasets/computer-vision/" title="Computer Vision" class="c-post-item__link" aria-label="Computer Vision"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/computer-vision-2.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3 class="c-post-item__title">Computer Vision</h3>
      </div>
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked" href="https://dagshub.com/datasets/geology/" title="Geology" class="c-post-item__link" aria-label="Geology"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/geology.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3 class="c-post-item__title">Geology</h3>
      </div>
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked" href="https://dagshub.com/datasets/tabular/" title="Tabular" class="c-post-item__link" aria-label="Tabular"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/tabular.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3 class="c-post-item__title">Tabular</h3>
      </div>
      <div class="c-post-item c-post-item--alt ">
        <a data-analytics-event="More_categories_Clicked" href="https://dagshub.com/datasets/urban/" title="Urban" class="c-post-item__link" aria-label="Urban"></a>
        <div class="c-post-item__image">
          <img width="28" height="28" src="https://dagshub.com/wp-content/uploads/2023/02/urban.svg" class="" alt="" decoding="async" loading="lazy" />
        </div>
        <h3
class="c-post-item__title">Urban</h3> </div>
<!-- "Show more" control. type="button" makes the non-submitting intent explicit; the arrow icon is decorative, so it is hidden from assistive technology. -->
<article class="c-posts-item c-posts-alt__button c-post-item--action js-load-more-category-posts">
  <span><button type="button" class="c-btn c-btn-primary-link" data-analytics-event="More_categories_Clicked" > Show more<svg width="16" height="16" viewBox="0 0 16 16" fill="none" xmlns="http://www.w3.org/2000/svg" aria-hidden="true" focusable="false"><path fill-rule="evenodd" clip-rule="evenodd" d="M8.19527 4.19526C8.45562 3.93491 8.87773 3.93491 9.13808 4.19526L12.4714 7.5286C12.5964 7.65362 12.6667 7.82319 12.6667 8C12.6667 8.17681 12.5964 8.34638 12.4714 8.47141L9.13808 11.8047C8.87773 12.0651 8.45562 12.0651 8.19527 11.8047C7.93492 11.5444 7.93492 11.1223 8.19527 10.8619L10.3905 8.66667L4.00001 8.66667C3.63182 8.66667 3.33334 8.36819 3.33334 8C3.33334 7.63181 3.63182 7.33333 4.00001 7.33333L10.3905 7.33333L8.19527 5.13807C7.93492 4.87772 7.93492 4.45561 8.19527 4.19526Z" fill="currentColor"/></svg> </button></span>
</article>
</div> </div> </div> </main> </div><!-- #content -->
<!-- Pre-footer banner: headline, one-line description and a demo link. -->
<div class="site-pre-footer">
  <div class="container">
    <div class="content-wrapper">
      <h3 class="title"> Manage your unstructured data. Scale to millions of experiments today.
</h3>
      <p class="description">See how leading data scientists manage their data.</p>
      <div class="button-group">
        <!-- The empty target="" attribute was removed: it is not a valid browsing-context name and the link opens in the current tab either way. -->
        <a href="/book-a-demo/" class="btn btn__lg btn--primary" data-analytics-event="Footer_StartFree_Clicked">Book A Demo</a>
      </div>
    </div> </div> </div>
<!-- Site footer: logo, social links, navigation menu and newsletter form. -->
<div class="site-footer">
  <div class="container">
    <div class="site-footer__wrap">
      <div class="site-footer__logo">
        <div class="site-logo">
          <a href="https://dagshub.com/" class="custom-logo-link" rel="home"><img width="143" height="40" src="https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg" class="custom-logo" alt="DagsHub" decoding="async" /></a>
        </div>
        <div class="site-footer__social">
          <!-- <h3 class="wdiget-title">Follow us</h3> -->
          <!-- Social links are icon-only: the icon is hidden from assistive technology and the screen-reader-text span carries the link name. The stray double quote after height="18" has been removed from each svg tag. -->
          <ul class="social-list">
            <li class="social-list__item">
              <a href="https://twitter.com/TheRealDAGsHub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-twitter" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-twitter"></use></svg><span class="screen-reader-text">Twitter</span></a>
            </li>
            <li class="social-list__item">
              <a href="https://www.linkedin.com/company/dagshub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-linkedin" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-linkedin"></use></svg><span class="screen-reader-text">LinkedIn</span></a>
            </li>
            <li class="social-list__item">
              <a href="https://youtube.com/c/dagshub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-youtube" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-youtube"></use></svg><span class="screen-reader-text">YouTube</span></a>
            </li>
            <li class="social-list__item">
              <a href="https://discord.com/invite/9gU36Y6" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-discord" width="18" height="18" aria-hidden="true"><use
xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-discord"></use></svg><span class="screen-reader-text">Discord</span></a>
            </li>
          </ul>
        </div>
        <img src="https://dagshub.com/wp-content/uploads/2024/04/image-54.png" alt="" class="bottom_logo"/>
      </div>
      <!-- Footer navigation: top-level entries are href-less placeholder anchors that head each sub-menu. -->
      <div class="site-footer__frame">
        <div class="site-footer__holder">
          <div class="site-footer__nav">
            <ul id="menu-pro-footer-menu" class="footer-nav"><li id="menu-item-14" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-14"><a>Resources</a>
              <ul class="sub-menu">
                <li id="menu-item-15" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-15"><a href="https://dagshub.com/docs">Docs</a></li>
                <li id="menu-item-16" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-16"><a href="https://dagshub.com/blog">Blog</a></li>
                <li id="menu-item-101" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-101"><a href="/datasets/">Datasets</a></li>
                <li id="menu-item-1586" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-1586"><a href="/glossary/">Glossary</a></li>
                <li id="menu-item-2247" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2247"><a href="https://dagshub.com/blog/tag/case-study/">Case Studies</a></li>
                <li id="menu-item-2244" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2244"><a href="https://dagshub.com/blog/tag/tutorials/">Tutorials &amp; Webinars</a></li>
              </ul>
            </li>
            <li id="menu-item-1708" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-1708"><a>Product</a>
              <ul class="sub-menu">
                <li id="menu-item-2076" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2076"><a href="https://dagshub.com/data-engine/">Data Engine</a></li>
                <li id="menu-item-2250" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2250"><a
href="https://dagshub.com/use-cases/llm/">LLMs</a></li>
                <li id="menu-item-1463" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-1463"><a href="https://dagshub.com/product/">Platform</a></li>
                <li id="menu-item-1711" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-1711"><a href="https://dagshub.com/enterprise/">Enterprise</a></li>
                <li id="menu-item-2464" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2464"><a href="https://dagshub.com/pricing">Pricing</a></li>
              </ul>
            </li>
            <li id="menu-item-2347" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2347"><a>Company</a>
              <ul class="sub-menu">
                <li id="menu-item-2348" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2348"><a href="https://dagshub.com/about">About</a></li>
                <li id="menu-item-2349" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2349"><a href="https://dagshub.com/careers">Careers</a></li>
                <li id="menu-item-2350" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2350"><a href="https://dagshub.com/contact-us/">Contact us</a></li>
              </ul>
            </li>
            <li id="menu-item-18" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-18"><a>Community</a>
              <ul class="sub-menu">
                <li id="menu-item-17" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-17"><a href="https://dagshub.com/explore/repos">Explore</a></li>
              </ul>
            </li>
            </ul>
          </div>
          <div class="site-footer__info"> </div>
        </div>
      </div>
      <!-- Newsletter sign-up (Contact Form 7 form 2374). aria-label names the form by its purpose so it is distinguishable from the page's other form. -->
      <div class="footer_subcscription">
        <div class="wpcf7 no-js" id="wpcf7-f2374-o1" lang="en-US" dir="ltr">
          <div class="screen-reader-response"><p role="status" aria-live="polite" aria-atomic="true"></p> <ul></ul></div>
          <form action="/datasets/nlp/#wpcf7-f2374-o1" method="post" class="wpcf7-form init" aria-label="Newsletter signup form" novalidate="novalidate" data-status="init">
            <div style="display:
none;">
              <input type="hidden" name="_wpcf7" value="2374" />
              <input type="hidden" name="_wpcf7_version" value="5.9.8" />
              <input type="hidden" name="_wpcf7_locale" value="en_US" />
              <input type="hidden" name="_wpcf7_unit_tag" value="wpcf7-f2374-o1" />
              <input type="hidden" name="_wpcf7_container_post" value="0" />
              <input type="hidden" name="_wpcf7_posted_data_hash" value="" />
              <input type="hidden" name="_wpcf7_recaptcha_response" value="" />
            </div>
            <div class="footer-subcription-box">
              <h3 class="title">ML Newsletter</h3>
              <p class="description">Top MLOps articles, case studies, events (and more) in your inbox every month</p>
              <div class="form-wrap c-form-subscription">
                <!-- The email field has no visible label (placeholder only), so aria-label supplies its accessible name. -->
                <div class="c-form-primary__field"><span class="wpcf7-form-control-wrap" data-name="your-email"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-email wpcf7-validates-as-required wpcf7-text wpcf7-validates-as-email" autocomplete="email" aria-label="Email" aria-required="true" aria-invalid="false" placeholder="Email" value="" type="email" name="your-email" /></span></div>
                <input class="wpcf7-form-control wpcf7-submit has-spinner" type="submit" value="Subscribe" />
              </div>
              <!-- Confirmation message; hidden by its inline style in the served markup. -->
              <div id="customMessage" style="display: none;"> You're subscribed! Check your inbox for exciting updates!
</div> </div><div class="wpcf7-response-output" aria-hidden="true"></div> </form>
        </div> </div> </div>
    <div class="site-footer__row">
      <!-- Copyright line: the original text repeated the © symbol and carried two different years (2024 and 2023). NOTE(review): 2024 was kept as the year; confirm. -->
      <div class="site-footer__copy">© Copyright DagsHub 2024</div>
    </div>
  </div>
  <div class="elipse-background"></div>
  <div class="elipse-background right"></div>
</div> </div>
<!-- "Contact us" modal wrapping Contact Form 7 form 1687. Each visible label points at its input through matching for/id values. -->
<div class="modal fade c-modal c-modal-default cf7-form-modal show" tabindex="-1" id="modal-1687">
  <div class="modal-dialog">
    <div class="modal-content">
      <div class="modal-header"> Contact us </div>
      <div class="modal-body">
        <div class="wpcf7 no-js" id="wpcf7-f1687-o2" lang="en-US" dir="ltr">
          <div class="screen-reader-response"><p role="status" aria-live="polite" aria-atomic="true"></p> <ul></ul></div>
          <form action="/datasets/nlp/#wpcf7-f1687-o2" method="post" class="wpcf7-form init" aria-label="Contact form" novalidate="novalidate" data-status="init">
            <div style="display: none;">
              <input type="hidden" name="_wpcf7" value="1687" />
              <input type="hidden" name="_wpcf7_version" value="5.9.8" />
              <input type="hidden" name="_wpcf7_locale" value="en_US" />
              <input type="hidden" name="_wpcf7_unit_tag" value="wpcf7-f1687-o2" />
              <input type="hidden" name="_wpcf7_container_post" value="0" />
              <input type="hidden" name="_wpcf7_posted_data_hash" value="" />
              <input type="hidden" name="_wpcf7_recaptcha_response" value="" />
            </div>
            <div class="c-form-primary">
              <div class="c-form-primary__row">
                <div class="c-form-primary__field">
                  <label for="first-name" class="c-form-primary__label">First Name</label>
                  <div class="c-form-primary__field-element">
                    <!-- id matches the label's for value; autocomplete lets browsers offer the stored given name. -->
                    <span class="wpcf7-form-control-wrap" data-name="first-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" id="first-name" autocomplete="given-name" aria-required="true" aria-invalid="false" placeholder="Enter your first name here" value="" type="text" name="first-name" /></span>
                  </div>
                </div>
              </div>
              <div class="c-form-primary__row">
                <div class="c-form-primary__field">
                  <label for="last-name"
class="c-form-primary__label">Last Name</label>
                  <div class="c-form-primary__field-element">
                    <span class="wpcf7-form-control-wrap" data-name="last-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" id="last-name" autocomplete="family-name" aria-required="true" aria-invalid="false" placeholder="Enter your last name here" value="" type="text" name="last-name" /></span>
                  </div>
                </div>
              </div>
              <!-- Each input below carries an id equal to its label's for value so the visible label is programmatically associated with the field. -->
              <div class="c-form-primary__row">
                <div class="c-form-primary__field">
                  <label for="clients-email" class="c-form-primary__label">Work email</label>
                  <div class="c-form-primary__field-element">
                    <span class="wpcf7-form-control-wrap" data-name="clients-email"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-email wpcf7-validates-as-required wpcf7-text wpcf7-validates-as-email required" id="clients-email" autocomplete="email" aria-required="true" aria-invalid="false" placeholder="Enter your work email here" value="" type="email" name="clients-email" /></span>
                  </div>
                </div>
              </div>
              <div class="c-form-primary__row">
                <div class="c-form-primary__field">
                  <!-- The label previously used for="Company-name" (capital C); it now uses the same lowercase spelling as the field name and the new id. -->
                  <label for="company-name" class="c-form-primary__label">Company name</label>
                  <div class="c-form-primary__field-element">
                    <span class="wpcf7-form-control-wrap" data-name="company-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" id="company-name" autocomplete="organization" aria-required="true" aria-invalid="false" placeholder="Enter your company name here" value="" type="text" name="company-name" /></span>
                  </div>
                </div>
              </div>
              <div class="c-form-primary__row">
                <div class="c-form-primary__field">
                  <label for="job-title" class="c-form-primary__label">Job title</label>
                  <div class="c-form-primary__field-element">
                    <span class="wpcf7-form-control-wrap" data-name="job-title"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" id="job-title" autocomplete="organization-title" aria-required="true" aria-invalid="false" placeholder="Enter your job title here" value="" type="text" name="job-title" /></span>
                  </div>
                </div>
              </div>
              <div
class="c-form-primary__actions">
                <input class="wpcf7-form-control wpcf7-submit has-spinner" type="submit" value="Request a demo" />
              </div>
            </div><div class="wpcf7-response-output" aria-hidden="true"></div>
          </form>
        </div> </div> </div> </div> </div>
<!-- Footer scripts, loaded in document order: wp-hooks, wp-i18n (plus its inline locale setup), Contact Form 7 (swv, inline config, main script), jQuery and jQuery Migrate, Fancybox, the theme's jquery.main.js, then the inline configuration that precedes front-end.js. -->
<script src="https://dagshub.com/wp-includes/js/dist/hooks.min.js?ver=2810c76e705dd1a53b18" id="wp-hooks-js"></script>
<script src="https://dagshub.com/wp-includes/js/dist/i18n.min.js?ver=5e580eb46a90c2b997e6" id="wp-i18n-js"></script>
<script id="wp-i18n-js-after"> wp.i18n.setLocaleData( { 'text direction\u0004ltr': [ 'ltr' ] } ); </script>
<script src="https://dagshub.com/wp-content/plugins/contact-form-7/includes/swv/js/index.js?ver=5.9.8" id="swv-js"></script>
<script id="contact-form-7-js-extra"> var wpcf7 = {"api":{"root":"https:\/\/dagshub.com\/wp-json\/","namespace":"contact-form-7\/v1"},"cached":"1"}; </script>
<script src="https://dagshub.com/wp-content/plugins/contact-form-7/includes/js/index.js?ver=5.9.8" id="contact-form-7-js"></script>
<script src="https://dagshub.com/wp-includes/js/jquery/jquery.min.js?ver=3.7.1" id="jquery-core-js"></script>
<script src="https://dagshub.com/wp-includes/js/jquery/jquery-migrate.min.js?ver=3.4.1" id="jquery-migrate-js"></script>
<script src="https://dagshub.com/wp-content/themes/wp-d-theme/vendors/fancybox/fancybox.min.js?ver=4.0.31" id="fancybox-new-js-js"></script>
<script src="https://dagshub.com/wp-content/themes/wp-d-theme/vendors/jquery.main.js?ver=1724154105" id="custom-js"></script>
<script id="scripts-js-extra"> var air_light_screenReaderText = {"expand":"Open child menu","collapse":"Close child menu","expand_for":"Open child menu for","collapse_for":"Close child menu for","expand_toggle":"Open main menu","collapse_toggle":"Close main menu","external_link":"External site","target_blank":"opens in a new window","previous_slide":"Previous slide","next_slide":"Next slide","last_slide":"Last slide","skip_slider":"Skip over the carousel element"}; var
air_light_externalLinkDomains = ["localhost:3000","airdev.test","airwptheme.com","localhost"]; </script>
<!-- NOTE(review): the domain list above contains only localhost/dev-looking hosts; confirm this is the intended configuration for the served page. -->
<!-- Remaining scripts in document order: theme front-end bundle, Google reCAPTCHA v3 loader, wp-polyfill, inline reCAPTCHA config for Contact Form 7, and the Contact Form 7 reCAPTCHA module. -->
<script src="https://dagshub.com/wp-content/themes/wp-d-theme/js/prod/front-end.js?ver=1724154107" id="scripts-js"></script>
<script src="https://www.google.com/recaptcha/api.js?render=6LfHrukpAAAAAA9UYBYO1jTWc1qASGHFOc5xtGfG&ver=3.0" id="google-recaptcha-js"></script>
<script src="https://dagshub.com/wp-includes/js/dist/vendor/wp-polyfill.min.js?ver=3.15.0" id="wp-polyfill-js"></script>
<script id="wpcf7-recaptcha-js-extra"> var wpcf7_recaptcha = {"sitekey":"6LfHrukpAAAAAA9UYBYO1jTWc1qASGHFOc5xtGfG","actions":{"homepage":"homepage","contactform":"contactform"}}; </script>
<script src="https://dagshub.com/wp-content/plugins/contact-form-7/modules/recaptcha/index.js?ver=5.9.8" id="wpcf7-recaptcha-js"></script>
<!-- Back-to-top link: visible content is an arrow icon hidden from assistive technology; the screen-reader-text span provides the link's name. -->
<a href="#page" id="top" class="top no-external-link-indicator" data-version="9.2.2">
  <span class="screen-reader-text">Back to top</span>
  <span aria-hidden="true"><svg width="6" height="4" viewBox="0 0 6 4" fill="none" xmlns="http://www.w3.org/2000/svg">
    <path d="M3 0.000342107L6 3.00034L5.4625 3.53784L3 1.06284L0.537501 3.52534L5.2492e-07 2.98784L3 0.000342107Z" fill="currentColor" />
  </svg> </span>
</a>
</body>
</html>