CINXE.COM
Free Japanese Tokenizer Dictionaries Dataset | DagsHub
<!doctype html>
<html lang="en-US">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1">
<link rel="profile" href="http://gmpg.org/xfn/11">
<!--
  Sign-in bootstrap.
  Reads the "dags_awesome" (username) and "ajs_user_id" (user id) cookies.
  When both are present and is_home is true, the visitor is redirected to
  the dashboard. Otherwise the body element is tagged with
  data-md-signed-in="false".
  The script must keep its line breaks: it uses line comments, so collapsing
  it onto a single line comments out every statement after the first one.
-->
<script>
  // Constants
  const SIGN_IN_STATUS_ATTRIBUTE = 'data-md-signed-in',
    SIGNED_IN_STATUS = 'true',
    SIGNED_OUT_STATUS = 'false';
  const SIGN_IN_USERNAME_COOKIE = 'dags_awesome',
    SIGN_IN_USER_ID_COOKIE = 'ajs_user_id';
  const base_url = 'https://dagshub.com',
    ajax_url = 'https://dagshub.com/wp-admin/admin-ajax.php';

  // Returns the value of the cookie called `name`, or undefined when no such cookie is set.
  const getCookie = (name) => {
    let match = document.cookie.match(new RegExp('(^| )' + name + '=([^;]+)'));
    if (match) return match[2];
  };

  const is_home = false;

  // Handling Signed in status
  let username = getCookie(SIGN_IN_USERNAME_COOKIE);
  let user_id = getCookie(SIGN_IN_USER_ID_COOKIE);

  if (username && user_id) {
    // NOTE: marking the body as signed in and filling the profile menu
    // (avatar, name, profile link) were commented out in the original and
    // remain disabled here.
    if (is_home) {
      location.replace(base_url + "/dashboard");
    }
  } else {
    // This script runs in the document head, where document.body is still
    // null, so the attribute can only be written once the body element exists.
    const markSignedOut = () => {
      document.body.setAttribute(SIGN_IN_STATUS_ATTRIBUTE, SIGNED_OUT_STATUS);
    };
    if (document.body) {
      markSignedOut();
    } else {
      document.addEventListener('DOMContentLoaded', markSignedOut, { once: true });
    }
  }
</script>
<meta name='robots' content='index, follow, max-image-preview:large, max-snippet:-1, max-video-preview:-1' />
<!-- This site is optimized with the Yoast SEO plugin v23.4 - https://yoast.com/wordpress/plugins/seo/ -->
<title>Free Japanese Tokenizer Dictionaries Dataset | DagsHub</title>
<meta name="description" content="Free Japanese Tokenizer Dictionaries dataset for machine learning. Find the right dataset for your model." 
/> <link rel="canonical" href="https://dagshub.com/datasets/japanese-tokenizer-dictionaries/" /> <meta property="og:locale" content="en_US" /> <meta property="og:type" content="article" /> <meta property="og:title" content="Free Japanese Tokenizer Dictionaries Dataset | DagsHub" /> <meta property="og:description" content="Free Japanese Tokenizer Dictionaries dataset for machine learning. Find the right dataset for your model." /> <meta property="og:url" content="https://dagshub.com/datasets/japanese-tokenizer-dictionaries/" /> <meta property="og:site_name" content="DagsHub" /> <meta property="article:modified_time" content="2023-02-21T12:32:23+00:00" /> <meta property="og:image" content="https://dagshub.com/wp-content/uploads/2023/04/General_OG_Image.jpg" /> <meta property="og:image:width" content="1200" /> <meta property="og:image:height" content="630" /> <meta property="og:image:type" content="image/jpeg" /> <meta name="twitter:card" content="summary_large_image" /> <meta name="twitter:site" content="@TheRealDagsHub" /> <script type="application/ld+json" class="yoast-schema-graph">{"@context":"https://schema.org","@graph":[{"@type":"WebPage","@id":"https://dagshub.com/datasets/japanese-tokenizer-dictionaries/","url":"https://dagshub.com/datasets/japanese-tokenizer-dictionaries/","name":"Free Japanese Tokenizer Dictionaries Dataset | DagsHub","isPartOf":{"@id":"https://dagshub.com/#website"},"datePublished":"2023-02-21T12:32:21+00:00","dateModified":"2023-02-21T12:32:23+00:00","description":"Free Japanese Tokenizer Dictionaries dataset for machine learning. 
Find the right dataset for your model.","breadcrumb":{"@id":"https://dagshub.com/datasets/japanese-tokenizer-dictionaries/#breadcrumb"},"inLanguage":"en-US","potentialAction":[{"@type":"ReadAction","target":["https://dagshub.com/datasets/japanese-tokenizer-dictionaries/"]}]},{"@type":"BreadcrumbList","@id":"https://dagshub.com/datasets/japanese-tokenizer-dictionaries/#breadcrumb","itemListElement":[{"@type":"ListItem","position":1,"name":"Datasets","item":"https://dagshub.com/datasets/"},{"@type":"ListItem","position":2,"name":"NLP","item":"https://dagshub.com/datasets/nlp/"},{"@type":"ListItem","position":3,"name":"Japanese Tokenizer Dictionaries"}]},{"@type":"WebSite","@id":"https://dagshub.com/#website","url":"https://dagshub.com/","name":"DagsHub","description":"","publisher":{"@id":"https://dagshub.com/#organization"},"potentialAction":[{"@type":"SearchAction","target":{"@type":"EntryPoint","urlTemplate":"https://dagshub.com/?s={search_term_string}"},"query-input":{"@type":"PropertyValueSpecification","valueRequired":true,"valueName":"search_term_string"}}],"inLanguage":"en-US"},{"@type":"Organization","@id":"https://dagshub.com/#organization","name":"DagsHub","url":"https://dagshub.com/","logo":{"@type":"ImageObject","inLanguage":"en-US","@id":"https://dagshub.com/#/schema/logo/image/","url":"https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg","contentUrl":"https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg","width":143,"height":40,"caption":"DagsHub"},"image":{"@id":"https://dagshub.com/#/schema/logo/image/"},"sameAs":["https://x.com/TheRealDagsHub","https://www.linkedin.com/company/dagshub"]}]}</script> <!-- / Yoast SEO plugin. 
--> <link rel='dns-prefetch' href='//dagshub.com' /> <link rel="alternate" type="application/rss+xml" title="DagsHub » Feed" href="https://dagshub.com/feed/" /> <link rel="alternate" type="application/rss+xml" title="DagsHub » Comments Feed" href="https://dagshub.com/comments/feed/" /> <link rel="alternate" type="application/rss+xml" title="DagsHub » Japanese Tokenizer Dictionaries Comments Feed" href="https://dagshub.com/datasets/japanese-tokenizer-dictionaries/feed/" /> <script> window._wpemojiSettings = {"baseUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/72x72\/","ext":".png","svgUrl":"https:\/\/s.w.org\/images\/core\/emoji\/15.0.3\/svg\/","svgExt":".svg","source":{"concatemoji":"https:\/\/dagshub.com\/wp-includes\/js\/wp-emoji-release.min.js?ver=4e55ae54fa701286f578c2d0b9d76284"}}; /*! This file is auto-generated */ !function(i,n){var o,s,e;function c(e){try{var t={supportTests:e,timestamp:(new Date).valueOf()};sessionStorage.setItem(o,JSON.stringify(t))}catch(e){}}function p(e,t,n){e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(t,0,0);var t=new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data),r=(e.clearRect(0,0,e.canvas.width,e.canvas.height),e.fillText(n,0,0),new Uint32Array(e.getImageData(0,0,e.canvas.width,e.canvas.height).data));return t.every(function(e,t){return e===r[t]})}function u(e,t,n){switch(t){case"flag":return n(e,"\ud83c\udff3\ufe0f\u200d\u26a7\ufe0f","\ud83c\udff3\ufe0f\u200b\u26a7\ufe0f")?!1:!n(e,"\ud83c\uddfa\ud83c\uddf3","\ud83c\uddfa\u200b\ud83c\uddf3")&&!n(e,"\ud83c\udff4\udb40\udc67\udb40\udc62\udb40\udc65\udb40\udc6e\udb40\udc67\udb40\udc7f","\ud83c\udff4\u200b\udb40\udc67\u200b\udb40\udc62\u200b\udb40\udc65\u200b\udb40\udc6e\u200b\udb40\udc67\u200b\udb40\udc7f");case"emoji":return!n(e,"\ud83d\udc26\u200d\u2b1b","\ud83d\udc26\u200b\u2b1b")}return!1}function f(e,t,n){var r="undefined"!=typeof WorkerGlobalScope&&self instanceof WorkerGlobalScope?new 
OffscreenCanvas(300,150):i.createElement("canvas"),a=r.getContext("2d",{willReadFrequently:!0}),o=(a.textBaseline="top",a.font="600 32px Arial",{});return e.forEach(function(e){o[e]=t(a,e,n)}),o}function t(e){var t=i.createElement("script");t.src=e,t.defer=!0,i.head.appendChild(t)}"undefined"!=typeof Promise&&(o="wpEmojiSettingsSupports",s=["flag","emoji"],n.supports={everything:!0,everythingExceptFlag:!0},e=new Promise(function(e){i.addEventListener("DOMContentLoaded",e,{once:!0})}),new Promise(function(t){var n=function(){try{var e=JSON.parse(sessionStorage.getItem(o));if("object"==typeof e&&"number"==typeof e.timestamp&&(new Date).valueOf()<e.timestamp+604800&&"object"==typeof e.supportTests)return e.supportTests}catch(e){}return null}();if(!n){if("undefined"!=typeof Worker&&"undefined"!=typeof OffscreenCanvas&&"undefined"!=typeof URL&&URL.createObjectURL&&"undefined"!=typeof Blob)try{var e="postMessage("+f.toString()+"("+[JSON.stringify(s),u.toString(),p.toString()].join(",")+"));",r=new Blob([e],{type:"text/javascript"}),a=new Worker(URL.createObjectURL(r),{name:"wpTestEmojiSupports"});return void(a.onmessage=function(e){c(n=e.data),a.terminate(),t(n)})}catch(e){}c(n=f(s,u,p))}t(n)}).then(function(e){for(var t in e)n.supports[t]=e[t],n.supports.everything=n.supports.everything&&n.supports[t],"flag"!==t&&(n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&n.supports[t]);n.supports.everythingExceptFlag=n.supports.everythingExceptFlag&&!n.supports.flag,n.DOMReady=!1,n.readyCallback=function(){n.DOMReady=!0}}).then(function(){return e}).then(function(){var e;n.supports.everything||(n.readyCallback(),(e=n.source||{}).concatemoji?t(e.concatemoji):e.wpemoji&&e.twemoji&&(t(e.twemoji),t(e.wpemoji)))}))}((window,document),window._wpemojiSettings); </script> <link rel='stylesheet' id='block-editor-styles-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/editor.css?ver=1732810781' type='text/css' media='all' /> <style 
id='wp-emoji-styles-inline-css' type='text/css'> img.wp-smiley, img.emoji { display: inline !important; border: none !important; box-shadow: none !important; height: 1em !important; width: 1em !important; margin: 0 0.07em !important; vertical-align: -0.1em !important; background: none !important; padding: 0 !important; } </style> <link rel='stylesheet' id='wp-block-library-css' href='https://dagshub.com/wp-includes/css/dist/block-library/style.min.css?ver=4e55ae54fa701286f578c2d0b9d76284' type='text/css' media='all' /> <style id='wp-block-library-theme-inline-css' type='text/css'> .wp-block-audio :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-audio :where(figcaption){color:#ffffffa6}.wp-block-audio{margin:0 0 1em}.wp-block-code{border:1px solid #ccc;border-radius:4px;font-family:Menlo,Consolas,monaco,monospace;padding:.8em 1em}.wp-block-embed :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-embed :where(figcaption){color:#ffffffa6}.wp-block-embed{margin:0 0 1em}.blocks-gallery-caption{color:#555;font-size:13px;text-align:center}.is-dark-theme .blocks-gallery-caption{color:#ffffffa6}:root :where(.wp-block-image figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme :root :where(.wp-block-image figcaption){color:#ffffffa6}.wp-block-image{margin:0 0 1em}.wp-block-pullquote{border-bottom:4px solid;border-top:4px solid;color:currentColor;margin-bottom:1.75em}.wp-block-pullquote cite,.wp-block-pullquote footer,.wp-block-pullquote__citation{color:currentColor;font-size:.8125em;font-style:normal;text-transform:uppercase}.wp-block-quote{border-left:.25em solid;margin:0 0 1.75em;padding-left:1em}.wp-block-quote cite,.wp-block-quote footer{color:currentColor;font-size:.8125em;font-style:normal;position:relative}.wp-block-quote.has-text-align-right{border-left:none;border-right:.25em 
solid;padding-left:0;padding-right:1em}.wp-block-quote.has-text-align-center{border:none;padding-left:0}.wp-block-quote.is-large,.wp-block-quote.is-style-large,.wp-block-quote.is-style-plain{border:none}.wp-block-search .wp-block-search__label{font-weight:700}.wp-block-search__button{border:1px solid #ccc;padding:.375em .625em}:where(.wp-block-group.has-background){padding:1.25em 2.375em}.wp-block-separator.has-css-opacity{opacity:.4}.wp-block-separator{border:none;border-bottom:2px solid;margin-left:auto;margin-right:auto}.wp-block-separator.has-alpha-channel-opacity{opacity:1}.wp-block-separator:not(.is-style-wide):not(.is-style-dots){width:100px}.wp-block-separator.has-background:not(.is-style-dots){border-bottom:none;height:1px}.wp-block-separator.has-background:not(.is-style-wide):not(.is-style-dots){height:2px}.wp-block-table{margin:0 0 1em}.wp-block-table td,.wp-block-table th{word-break:normal}.wp-block-table :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-table :where(figcaption){color:#ffffffa6}.wp-block-video :where(figcaption){color:#555;font-size:13px;text-align:center}.is-dark-theme .wp-block-video :where(figcaption){color:#ffffffa6}.wp-block-video{margin:0 0 1em}:root :where(.wp-block-template-part.has-background){margin-bottom:0;margin-top:0;padding:1.25em 2.375em} </style> <style id='safe-svg-svg-icon-style-inline-css' type='text/css'> .safe-svg-cover{text-align:center}.safe-svg-cover .safe-svg-inside{display:inline-block;max-width:100%}.safe-svg-cover svg{height:100%;max-height:100%;max-width:100%;width:100%} </style> <style id='classic-theme-styles-inline-css' type='text/css'> /*! 
This file is auto-generated */ .wp-block-button__link{color:#fff;background-color:#32373c;border-radius:9999px;box-shadow:none;text-decoration:none;padding:calc(.667em + 2px) calc(1.333em + 2px);font-size:1.125em}.wp-block-file__button{background:#32373c;color:#fff;text-decoration:none} </style> <style id='global-styles-inline-css' type='text/css'> :root{--wp--preset--aspect-ratio--square: 1;--wp--preset--aspect-ratio--4-3: 4/3;--wp--preset--aspect-ratio--3-4: 3/4;--wp--preset--aspect-ratio--3-2: 3/2;--wp--preset--aspect-ratio--2-3: 2/3;--wp--preset--aspect-ratio--16-9: 16/9;--wp--preset--aspect-ratio--9-16: 9/16;--wp--preset--color--black: #000000;--wp--preset--color--cyan-bluish-gray: #abb8c3;--wp--preset--color--white: #ffffff;--wp--preset--color--pale-pink: #f78da7;--wp--preset--color--vivid-red: #cf2e2e;--wp--preset--color--luminous-vivid-orange: #ff6900;--wp--preset--color--luminous-vivid-amber: #fcb900;--wp--preset--color--light-green-cyan: #7bdcb5;--wp--preset--color--vivid-green-cyan: #00d084;--wp--preset--color--pale-cyan-blue: #8ed1fc;--wp--preset--color--vivid-cyan-blue: #0693e3;--wp--preset--color--vivid-purple: #9b51e0;--wp--preset--color--eeee-22: #eeee22;--wp--preset--color--81-d-742: #81d742;--wp--preset--color--1-e-73-be: #1e73be;--wp--preset--color--8224-e-3: #8224e3;--wp--preset--color--6-b-6-b-6-b: #6b6b6b;--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple: linear-gradient(135deg,rgba(6,147,227,1) 0%,rgb(155,81,224) 100%);--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan: linear-gradient(135deg,rgb(122,220,180) 0%,rgb(0,208,130) 100%);--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange: linear-gradient(135deg,rgba(252,185,0,1) 0%,rgba(255,105,0,1) 100%);--wp--preset--gradient--luminous-vivid-orange-to-vivid-red: linear-gradient(135deg,rgba(255,105,0,1) 0%,rgb(207,46,46) 100%);--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray: linear-gradient(135deg,rgb(238,238,238) 0%,rgb(169,184,195) 
100%);--wp--preset--gradient--cool-to-warm-spectrum: linear-gradient(135deg,rgb(74,234,220) 0%,rgb(151,120,209) 20%,rgb(207,42,186) 40%,rgb(238,44,130) 60%,rgb(251,105,98) 80%,rgb(254,248,76) 100%);--wp--preset--gradient--blush-light-purple: linear-gradient(135deg,rgb(255,206,236) 0%,rgb(152,150,240) 100%);--wp--preset--gradient--blush-bordeaux: linear-gradient(135deg,rgb(254,205,165) 0%,rgb(254,45,45) 50%,rgb(107,0,62) 100%);--wp--preset--gradient--luminous-dusk: linear-gradient(135deg,rgb(255,203,112) 0%,rgb(199,81,192) 50%,rgb(65,88,208) 100%);--wp--preset--gradient--pale-ocean: linear-gradient(135deg,rgb(255,245,203) 0%,rgb(182,227,212) 50%,rgb(51,167,181) 100%);--wp--preset--gradient--electric-grass: linear-gradient(135deg,rgb(202,248,128) 0%,rgb(113,206,126) 100%);--wp--preset--gradient--midnight: linear-gradient(135deg,rgb(2,3,129) 0%,rgb(40,116,252) 100%);--wp--preset--font-size--small: 13px;--wp--preset--font-size--medium: 20px;--wp--preset--font-size--large: 36px;--wp--preset--font-size--x-large: 42px;--wp--preset--spacing--20: 0.44rem;--wp--preset--spacing--30: 0.67rem;--wp--preset--spacing--40: 1rem;--wp--preset--spacing--50: 1.5rem;--wp--preset--spacing--60: 2.25rem;--wp--preset--spacing--70: 3.38rem;--wp--preset--spacing--80: 5.06rem;--wp--preset--shadow--natural: 6px 6px 9px rgba(0, 0, 0, 0.2);--wp--preset--shadow--deep: 12px 12px 50px rgba(0, 0, 0, 0.4);--wp--preset--shadow--sharp: 6px 6px 0px rgba(0, 0, 0, 0.2);--wp--preset--shadow--outlined: 6px 6px 0px -3px rgba(255, 255, 255, 1), 6px 6px rgba(0, 0, 0, 1);--wp--preset--shadow--crisp: 6px 6px 0px rgba(0, 0, 0, 1);}:where(.is-layout-flex){gap: 0.5em;}:where(.is-layout-grid){gap: 0.5em;}body .is-layout-flex{display: flex;}.is-layout-flex{flex-wrap: wrap;align-items: center;}.is-layout-flex > :is(*, div){margin: 0;}body .is-layout-grid{display: grid;}.is-layout-grid > :is(*, div){margin: 0;}:where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 
2em;}:where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;}.has-black-color{color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-color{color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-color{color: var(--wp--preset--color--white) !important;}.has-pale-pink-color{color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-color{color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-color{color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-color{color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-color{color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-color{color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-color{color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-color{color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-color{color: var(--wp--preset--color--vivid-purple) !important;}.has-black-background-color{background-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-background-color{background-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-background-color{background-color: var(--wp--preset--color--white) !important;}.has-pale-pink-background-color{background-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-background-color{background-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-background-color{background-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-background-color{background-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-background-color{background-color: var(--wp--preset--color--light-green-cyan) 
!important;}.has-vivid-green-cyan-background-color{background-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-background-color{background-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-background-color{background-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-background-color{background-color: var(--wp--preset--color--vivid-purple) !important;}.has-black-border-color{border-color: var(--wp--preset--color--black) !important;}.has-cyan-bluish-gray-border-color{border-color: var(--wp--preset--color--cyan-bluish-gray) !important;}.has-white-border-color{border-color: var(--wp--preset--color--white) !important;}.has-pale-pink-border-color{border-color: var(--wp--preset--color--pale-pink) !important;}.has-vivid-red-border-color{border-color: var(--wp--preset--color--vivid-red) !important;}.has-luminous-vivid-orange-border-color{border-color: var(--wp--preset--color--luminous-vivid-orange) !important;}.has-luminous-vivid-amber-border-color{border-color: var(--wp--preset--color--luminous-vivid-amber) !important;}.has-light-green-cyan-border-color{border-color: var(--wp--preset--color--light-green-cyan) !important;}.has-vivid-green-cyan-border-color{border-color: var(--wp--preset--color--vivid-green-cyan) !important;}.has-pale-cyan-blue-border-color{border-color: var(--wp--preset--color--pale-cyan-blue) !important;}.has-vivid-cyan-blue-border-color{border-color: var(--wp--preset--color--vivid-cyan-blue) !important;}.has-vivid-purple-border-color{border-color: var(--wp--preset--color--vivid-purple) !important;}.has-vivid-cyan-blue-to-vivid-purple-gradient-background{background: var(--wp--preset--gradient--vivid-cyan-blue-to-vivid-purple) !important;}.has-light-green-cyan-to-vivid-green-cyan-gradient-background{background: var(--wp--preset--gradient--light-green-cyan-to-vivid-green-cyan) 
!important;}.has-luminous-vivid-amber-to-luminous-vivid-orange-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-amber-to-luminous-vivid-orange) !important;}.has-luminous-vivid-orange-to-vivid-red-gradient-background{background: var(--wp--preset--gradient--luminous-vivid-orange-to-vivid-red) !important;}.has-very-light-gray-to-cyan-bluish-gray-gradient-background{background: var(--wp--preset--gradient--very-light-gray-to-cyan-bluish-gray) !important;}.has-cool-to-warm-spectrum-gradient-background{background: var(--wp--preset--gradient--cool-to-warm-spectrum) !important;}.has-blush-light-purple-gradient-background{background: var(--wp--preset--gradient--blush-light-purple) !important;}.has-blush-bordeaux-gradient-background{background: var(--wp--preset--gradient--blush-bordeaux) !important;}.has-luminous-dusk-gradient-background{background: var(--wp--preset--gradient--luminous-dusk) !important;}.has-pale-ocean-gradient-background{background: var(--wp--preset--gradient--pale-ocean) !important;}.has-electric-grass-gradient-background{background: var(--wp--preset--gradient--electric-grass) !important;}.has-midnight-gradient-background{background: var(--wp--preset--gradient--midnight) !important;}.has-small-font-size{font-size: var(--wp--preset--font-size--small) !important;}.has-medium-font-size{font-size: var(--wp--preset--font-size--medium) !important;}.has-large-font-size{font-size: var(--wp--preset--font-size--large) !important;}.has-x-large-font-size{font-size: var(--wp--preset--font-size--x-large) !important;} :where(.wp-block-post-template.is-layout-flex){gap: 1.25em;}:where(.wp-block-post-template.is-layout-grid){gap: 1.25em;} :where(.wp-block-columns.is-layout-flex){gap: 2em;}:where(.wp-block-columns.is-layout-grid){gap: 2em;} :root :where(.wp-block-pullquote){font-size: 1.5em;line-height: 1.6;} </style> <link rel='stylesheet' id='contact-form-7-css' 
href='https://dagshub.com/wp-content/plugins/contact-form-7/includes/css/styles.css?ver=5.9.8' type='text/css' media='all' /> <link rel='stylesheet' id='styles-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/main.css?ver=1732811207' type='text/css' media='all' /> <link rel='stylesheet' id='new-style-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/css/prod/new-style.css?ver=1732811209' type='text/css' media='all' /> <link rel='stylesheet' id='main-theme-style-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/style.css?ver=1724943191' type='text/css' media='all' /> <link rel='stylesheet' id='fancybox-css' href='https://dagshub.com/wp-content/themes/wp-d-theme/vendors/fancybox/fancybox.css?ver=4.0.31' type='text/css' media='all' /> <link rel="https://api.w.org/" href="https://dagshub.com/wp-json/" /><link rel="alternate" title="JSON" type="application/json" href="https://dagshub.com/wp-json/wp/v2/datasets/1256" /><link rel="EditURI" type="application/rsd+xml" title="RSD" href="https://dagshub.com/xmlrpc.php?rsd" /> <link rel='shortlink' href='https://dagshub.com/?p=1256' /> <link rel="alternate" title="oEmbed (JSON)" type="application/json+oembed" href="https://dagshub.com/wp-json/oembed/1.0/embed?url=https%3A%2F%2Fdagshub.com%2Fdatasets%2Fjapanese-tokenizer-dictionaries%2F" /> <link rel="alternate" title="oEmbed (XML)" type="text/xml+oembed" href="https://dagshub.com/wp-json/oembed/1.0/embed?url=https%3A%2F%2Fdagshub.com%2Fdatasets%2Fjapanese-tokenizer-dictionaries%2F&format=xml" /> <!-- Google Tag Manager --> <script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start': new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0], j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src= 'https://www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f); })(window,document,'script','dataLayer','GTM-PGHTMDN');</script> <!-- End Google Tag Manager --> <link rel="icon" 
href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-32x32.png" sizes="32x32" /> <link rel="icon" href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-192x192.png" sizes="192x192" /> <link rel="apple-touch-icon" href="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-180x180.png" /> <meta name="msapplication-TileImage" content="https://dagshub.com/wp-content/uploads/2023/01/cropped-DH-Logo-512x512-3-270x270.png" /> <style id="wp-custom-css"> .c-glossary__thumb{ top:0px; left:0px; } .header__actions .c-buttons { margin-top: 0; } .grecaptcha-badge{ visibility: hidden; } .home .site-head{ background-color:rgba(0,0,0,.0); } body:not(.home){ margin-top:68px; } body .site .main { padding-top: 0; } body:not(.home) .site { padding-top: 0px; } .home .site-head.site-head__scrolled{ background-color:#090819; } .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-height:66px; max-width:155px; object-fit: contain; } #wpcf7-f2379-p2377-o1 .c-form-primary__field:has(.wpcf7-not-valid) .wpcf7-not-valid-tip { display: block; } @media only screen and (max-width: 1280px) { .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-width:120px; max-height:55px; } } @media only screen and (max-width: 1199px) { .head-nav a:not(.btn) { display: block; } .head-nav a:not(.btn) .menu-item__text{ display:block; } .head-nav .sub-menu a:not(.btn) .menu-item__text{ display:inline-flex; } } @media only screen and (max-width: 1026px) { .canvas-animation--bg, .canvas-animation--bg canvas{ pointer-events:none; } .logos-gallery .main-gallery .main-gallery__row .gallery-item img{ max-width:90px; max-height:40px; } .home-hero-block .title__gradient div { -webkit-text-fill-color: #0000; background: linear-gradient(180deg, #fff 17.78%, #ffffff1a 191.11%); background-clip: text; -webkit-background-clip: text; pointer-events: none; } } @media only screen and (min-width: 1441px) { .site-head__nav { 
margin-right: auto; margin-right: auto; } } </style> </head> <body class="datasets-template-default single single-datasets postid-1256 wp-custom-logo no-js"> <a class="skip-link screen-reader-text js-trigger" href="#content">Skip to content</a> <!-- Google Tag Manager (noscript) --> <noscript><iframe src="https://www.googletagmanager.com/ns.html?id=GTM-PGHTMDN" height="0" width="0" style="display:none;visibility:hidden"></iframe></noscript> <!-- End Google Tag Manager (noscript) --> <div id="page" class="site"> <header class="site-head site-head__bacground" role="banner" itemscope="itemscope" itemtype="http://schema.org/WPHeader"> <div class="site-head__wrap"> <div class="container container-lg"> <div class="site-head__frame"> <!-- Custom logo and site title. --> <div class="site-logo"> <a href="https://dagshub.com/" class="custom-logo-link" rel="home"><img width="143" height="40" src="https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg" class="custom-logo" alt="DagsHub" decoding="async" /></a> <span class="screen-reader-text" itemprop="name">DagsHub</span> </div> <button class="nav-opener" aria-label="nav opener"><span><em>Menu</em></span></button> <div class="site-head__holder"> <!-- Main menu. 
-->
<!--
  Primary navigation. Each top-level entry is either a plain link or a title
  element followed by a dropdown-toggle button and a nested sub-menu list.
  Icons come from the theme's icons.svg sprite and are decorative, so they are
  hidden from assistive technology; the visible text carries the meaning.
-->
<nav class="site-head__nav js-header-menu-item" role="navigation" itemscope="itemscope" itemtype="http://schema.org/SiteNavigationElement">
  <ul class="menu head-nav main-header-menu">
    <li id="menu-item-2351" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2351">
      <div class="menu-item__link menu-item__link--title">Resources</div>
      <button type="button" class="dropdown-toggle" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
      <ul class="sub-menu level0">
        <li id="menu-item-2357" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2357">
          <a href="https://dagshub.com/blog/" class="menu-item__link"><span class="menu-item__text">Blog</span></a>
        </li>
        <li id="menu-item-2358" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2358">
          <a href="https://dagshub.com/datasets/" class="menu-item__link"><span class="menu-item__text">Datasets</span></a>
        </li>
        <li id="menu-item-2359" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2359">
          <a href="https://dagshub.com/glossary/" class="menu-item__link"><span class="menu-item__text">Glossary</span></a>
        </li>
        <li id="menu-item-2360" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2360">
          <a href="https://dagshub.com/blog/tag/tutorials/" class="menu-item__link"><span class="menu-item__text">Tutorial &amp; Webinars</span></a>
        </li>
      </ul>
    </li>
    <li id="menu-item-2352" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2352">
      <a href="https://dagshub.com/docs" class="menu-item__link"><span class="menu-item__text">Docs</span></a>
    </li>
    <li id="menu-item-2353" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2353">
      <div class="menu-item__link menu-item__link--title">Product</div>
      <button type="button" class="dropdown-toggle" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
      <ul class="sub-menu level0">
        <li id="menu-item-2361" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2361">
          <a href="https://dagshub.com/data-engine/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-data-engine" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-data-engine"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Data engine</span><span class="menu-description">Manage your unstructured data</span></span></span></a>
        </li>
        <li id="menu-item-2362" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2362">
          <a href="https://dagshub.com/use-cases/llm/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-llms" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-llms"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">LLMs</span><span class="menu-description">Build LLM projects quickly</span></span></span></a>
        </li>
        <li id="menu-item-2363" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2363">
          <a href="https://dagshub.com/product/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-linear-search" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-linear-search"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Overview</span><span class="menu-description">Organize your entire project under one roof</span></span></span></a>
        </li>
        <li id="menu-item-2364" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2364">
          <a href="https://dagshub.com/enterprise/" class="menu-item__link"><span class="menu-item__text"><span class="icon-image"><svg class="svg-icon icon-enterprise" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-enterprise"></use></svg></span><span class="menu-text-wrapper"><span class="menu-text">Enterprise</span><span class="menu-description">A single source of truth for your organization</span></span></span></a>
        </li>
      </ul>
    </li>
    <li id="menu-item-2354" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2354">
      <a href="/enterprise/" class="menu-item__link"><span class="menu-item__text">Enterprise</span></a>
    </li>
    <li id="menu-item-2355" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2355">
      <a href="https://dagshub.com/pricing" class="menu-item__link"><span class="menu-item__text">Pricing</span></a>
    </li>
    <li id="menu-item-2356" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2356">
      <div class="menu-item__link menu-item__link--title">Company</div>
      <button type="button" class="dropdown-toggle" aria-expanded="false"><span class="screen-readers">Expand child menu</span><span class="opener-arrow"><svg class="svg-icon icon-chevron-down" width="20" height="20" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-chevron-down"></use></svg></span></button>
      <ul class="sub-menu level0">
        <li id="menu-item-2365" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2365">
          <a href="https://dagshub.com/about" class="menu-item__link"><span class="menu-item__text">About</span></a>
        </li>
        <li id="menu-item-2366" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2366">
          <a href="https://dagshub.com/careers" class="menu-item__link"><span class="menu-item__text">Careers</span></a>
        </li>
        <li id="menu-item-2367" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2367">
          <a href="https://dagshub.com/contact-us/" class="menu-item__link"><span class="menu-item__text">Contact us</span></a>
        </li>
      </ul>
    </li>
  </ul>
</nav>
<!--
  Header call-to-action links.
  NOTE(review): the rel values below are not link types; they look like
  analytics event names read by a script elsewhere. Left untouched; confirm
  before renaming or moving them to data attributes.
-->
<div class="site-head__tools">
  <ul class="menu head-nav main-header-menu">
    <li id="menu-item-2372" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2372"><a rel="Navbar_Login_Clicked" href="https://dagshub.com/user/login" class="menu-item__link">Log in</a></li>
    <li id="menu-item-2389" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2389"><a rel="Navbar_BookADemo_Clicked" href="https://dagshub.com/book-a-demo/" class="menu-item__button btn btn--primary"><span class="btn__text">Book a demo</span></a></li>
  </ul>
</div>
</div>
</div>
</div>
</div>
</header>
<!-- Page body: the dataset article starts with a full-width, decorative hero image. -->
<div class="wrapper__body no-overlap">
<main class="main">
<article class="c-block b-block-single">
<header class="b-block-single__head">
<img width="1816" height="300" src="https://dagshub.com/wp-content/uploads/2023/01/milad-fakurian-PGdW_bHDbpI-unsplash-1.png" class="b-block-single__thumbnail" alt="" decoding="async" fetchpriority="high" srcset="https://dagshub.com/wp-content/uploads/2023/01/milad-fakurian-PGdW_bHDbpI-unsplash-1.png 1816w, https://dagshub.com/wp-content/uploads/2023/01/milad-fakurian-PGdW_bHDbpI-unsplash-1-300x50.png 300w, https://dagshub.com/wp-content/uploads/2023/01/milad-fakurian-PGdW_bHDbpI-unsplash-1-1024x169.png 1024w, https://dagshub.com/wp-content/uploads/2023/01/milad-fakurian-PGdW_bHDbpI-unsplash-1-768x127.png 768w" 
sizes="(max-width: 1816px) 100vw, 1816px" /> <div class="b-block-single__head-image-author"> <p>Photo by <a href="https://unsplash.com/@fakurian?utm_source=unsplash&utm_medium=referral&utm_content=creditCopyText">Milad Fakurian</a> on <a href="https://unsplash.com/wallpapers/screen/3d?utm_source=unsplash&utm_medium=referral&utm_content=creditCopyText">Unsplash</a></p> </div> </header> <div class="b-block-single__container"> <div class="container container--small"> <div class="b-block-single__actions"> <div class="c-breadcrumbs"> <p class="breadcrumbs"><span><span><a href="https://dagshub.com/datasets/">Datasets</a></span> » <span><a href="https://dagshub.com/datasets/nlp/">NLP</a></span> » <span class="breadcrumb_last" aria-current="page">Japanese Tokenizer Dictionaries</span></span></p></div> </div> <h1 class="b-block-single__title">Japanese Tokenizer Dictionaries Dataset for Machine Learning</h1> <ul class="c-list-categories"> <li class="c-list-categories__item"><a class="c-list-categories__link" href="https://dagshub.com/datasets/nlp/">NLP</a></li> <li class="c-list-categories__item"><a class="c-list-categories__link" href="https://dagshub.com/datasets/tabular/">Tabular</a></li> </ul> </div> <div class="b-block-single__middle"> <div class="container container--small"> <div class="b-block-single__content"> <div class="c-code"> <h3 class="c-code__title">Install DagsHub:</h3> <div class="c-code__body"> <pre class="c-code__preview"><code class="language-python">pip install dagshub</code></pre> <div class="c-code__overlay"> Click on copy button to copy content </div> <button class="c-btn c-btn-ghost c-code__copy" data-repo-id="InstallDagshub" data-analytics-event="CopySnippet_Clicked" data-current="Copy" data-active="Copied"><span aria-hidden="true">Copy</span></button> </div> </div> <div class="c-code"> <h3 class="c-code__title">To stream this data directly on DagsHub</h3> <div class="c-code__body"> <pre class="c-code__preview"><code class="language-python">from 
dagshub.streaming import DagsHubFilesystem fs = DagsHubFilesystem(".", repo_url="https://dagshub.com/DagsHub-Datasets/cotonoha-dic-dataset") fs.listdir("s3://cotonoha-dic")</code></pre> <div class="c-code__overlay"> Click on copy button to copy content </div> <button class="c-btn c-btn-ghost c-code__copy" data-repo-id="243" data-analytics-event="CopySnippet_Clicked" data-current="Copy" data-active="Copied"><span aria-hidden="true">Copy</span></button> </div> </div> <div class="c-entry"> <div class="c-dataset c-dataset--description-wrapper"> <h2>Description</h2> <div class="c-dataset c-dataset--description-wrapper__text"> <p>Japanese Tokenizer Dictionaries for use with MeCab.</p> </div> </div> <div class="c-dataset c-dataset--cta-wrapper"> <a class="c-btn c-btn-primary c-btn-suffix-none" data-analytics-event="ExploreLink_Clicked" data-repo-id="243" target="_blank" href="https://dagshub.com/DagsHub-Datasets/cotonoha-dic-dataset">Explore this dataset on DagsHub</a> </div> <h2>Additional information</h2> <div class="c-dataset c-dataset--documentation-wrapper"> <h3>Documentation</h3> <div class="c-dataset c-dataset--documentation-wrapper__text"> <p>This dataset includes dictionaries for tokenization and morphological<br /> analysis of Japanese for use with MeCab. 
This includes NINJAL’s UniDic, a<br /> modified smaller version of UniDic for situations that require it, and the<br /> legacy IPADic dictionary.</p> </div> </div> <div class="c-dataset c-dataset--update_frequency-wrapper"> <h3>Update frequency</h3> <div class="c-dataset c-dataset--update_frequency-wrapper__text"> <p>Infrequently (typically less than once a year)</p> </div> </div> <div class="c-dataset c-dataset--managed_by-wrapper"> <h3>Managed by</h3> <div class="c-dataset c-dataset--managed_by-wrapper__text"> <p>Cotonoha</p> </div> </div> <div class="c-dataset c-dataset--license-wrapper"> <h3>License</h3> <div class="c-dataset c-dataset--license-wrapper__text"> <p>Versions of Unidic offered here are available under the GPL/LGPL/BSD license.</p> <p>IPADic is offered under a unique BSD-like license. See below. </p> <p> <a href="https://github.com/polm/ipadic-py/blob/master/ipadic/dicdir/COPYING">https://github.com/polm/ipadic-py/blob/master/ipadic/dicdir/COPYING</a></p> </div> </div> <div class="c-dataset c-dataset--cta-wrapper"> <a class="c-btn c-btn-primary c-btn-suffix-none" data-analytics-event="ExploreLink_Clicked" data-repo-id="243" target="_blank" href="https://dagshub.com/DagsHub-Datasets/cotonoha-dic-dataset">Explore this dataset on DagsHub</a> </div> <div class="the-content "> </div> </div> <div class="c-list-tags"> <h3 class="c-list-tags__title">Tags</h3> <ul class="c-list-tags__list"> <li class="c-list-tags__item"><a class="c-list-tags__link" href="https://dagshub.com/datasets/tags/aws-pds/">aws-pds</a></li> <li class="c-list-tags__item"><a class="c-list-tags__link" href="https://dagshub.com/datasets/tags/csv/">csv</a></li> <li class="c-list-tags__item"><a class="c-list-tags__link" href="https://dagshub.com/datasets/tags/japanese/">japanese</a></li> <li class="c-list-tags__item"><a class="c-list-tags__link" href="https://dagshub.com/datasets/tags/natural-language-processing/">natural language processing</a></li> </ul> </div> </div> </div> </div> </div> 
</article> <div class="b-item-and-cta c-block"> <div class="container"> <div class="c-posts-alt"> <div class="c-posts-alt__head"> <h2 class="c-title c-posts-alt__title default" > Related datasets<br /> </h2> </div> <div class="c-posts-alt__body"> <article class="c-post-item c-post-item--id-1276 c-post-item--type-datasets c-post-item c-post-item--alt" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);"> <a class="c-post-item__link" data-analytics-event="Related_datasets_Clicked" data-repo-id="263" href="https://dagshub.com/datasets/common-screens/"></a> <div class="c-post-item__body"> <h2 class="c-post-item__title"> Common Screens </h2> </div> </article> <article class="c-post-item c-post-item--id-1345 c-post-item--type-datasets c-post-item c-post-item--alt" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);"> <a class="c-post-item__link" data-analytics-event="Related_datasets_Clicked" data-repo-id="332" href="https://dagshub.com/datasets/helpful-sentences-from-reviews/"></a> <div class="c-post-item__body"> <h2 class="c-post-item__title"> Helpful Sentences from Reviews </h2> </div> </article> <article class="c-post-item c-post-item--id-1136 c-post-item--type-datasets c-post-item c-post-item--alt" style="color:#7f1d1d;background: linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);"> <a class="c-post-item__link" data-analytics-event="Related_datasets_Clicked" data-repo-id="123" href="https://dagshub.com/datasets/humor-detection-from-product-question-answering-systems/"></a> <div class="c-post-item__body"> <h2 class="c-post-item__title"> Humor Detection from Product Question Answering Systems </h2> </div> </article> <article class="c-post-item c-post-item--id-1256 c-post-item--type-datasets c-post-item c-post-item--alt" style="color:#7f1d1d;background: 
linear-gradient(180deg, #FEF2F2 0%, #FEE2E2 100%), linear-gradient(180deg, #FEFCE8 0%, #FEF9C3 100%);"> <a class="c-post-item__link" data-analytics-event="Related_datasets_Clicked" data-repo-id="243" href="https://dagshub.com/datasets/japanese-tokenizer-dictionaries/"></a> <div class="c-post-item__body"> <h2 class="c-post-item__title"> Japanese Tokenizer Dictionaries </h2> </div> </article> </div> </div> <section id="b-oob-cta-691298" class="c-block b-block b-oob-cta b-oob b-oob-cta--layout-default c-block--padding-default b-oob--style-boxed-container "> <div class="c-background "> <div class="c-background__media"> <div class=" c-media " > <div class="c-media__element c-media__element--type-lottie c-media__element--all" style="top:0;bottom:0;"> <dotlottie-player class="c-lottie " data-offset="500" autoplay data-src="https://dagshub.com/wp-content/uploads/2023/01/20230212-093145lf30_editor_b9vmxals.lottie" data-replay="true" ></dotlottie-player> </div> </div> </div> <div class="c-background__overlay-color" style="background-color: rgba(7,0,17,0.09)"></div> <div class="container c-block__content"> <div class="b-oob-cta b-oob-inner"> <div class="c-cta c-cta--id-149 c-cta--style-default"> <div class="c-cta__inner"> <div class="c-cta__col c-cta__col--body"> <div class="c-section-header c-section-header--align- "> <h2 class="c-title c-section-header__title default" style="color: #ffffff !important" > Launch your ML development to new heights with DagsHub<br /> </h2> </div> </div> <div class="c-cta__col c-cta__col--action"> <div class="c-buttons-or-form "> <ul class="c-buttons "> <li class="c-button testimonials-section__bottom-action c-button--type-link c-button__style--primary"> <a data-analytics-event="DataSet Page SignUp CTA Clicked" class="c-btn c-btn-primary" href="https://dagshub.com/user/sign_up?redirect_to=" target="_self" title="Get started – it’s free! "> Get started – it’s free! 
</a> </li> </ul> </div> </div> </div> </div> </div> </div> </div></section> </div> </div> </main> </div><!-- #content --> <div class="site-pre-footer"> <div class="container"> <div class="content-wrapper"> <h3 class="title"> Manage your unstructured data. Scale to millions of experiments today. </h3> <p class="description">See how leading data scientists manage their data.</p> <div class="button-group"> <a href="/book-a-demo/" target="" class="btn btn__lg btn--primary" data-analytics-event="Footer_StartFree_Clicked">Book A Demo</a> </div> </div> </div> </div> <div class="site-footer"> <div class="container"> <div class="site-footer__wrap"> <div class="site-footer__logo"> <div class="site-logo"> <a href="https://dagshub.com/" class="custom-logo-link" rel="home"><img width="143" height="40" src="https://dagshub.com/wp-content/uploads/2024/04/dagshab.svg" class="custom-logo" alt="DagsHub" decoding="async" /></a> </div> <div class="site-footer__social"> <!-- <h3 class="wdiget-title">Follow us</h3> --> <!-- Icon-only social links. The text in each screen-reader-text span is the link's accessible name (NOTE(review): presumably the theme CSS hides this class visually - confirm); the SVG icon is decorative, hence aria-hidden. rel="noopener" stops the new tab from reaching window.opener. --> <ul class="social-list"> <li class="social-list__item"> <a href="https://twitter.com/TheRealDAGsHub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-twitter" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-twitter"></use></svg><span class="screen-reader-text">DagsHub on Twitter</span></a> </li> <li class="social-list__item"> <a href="https://www.linkedin.com/company/dagshub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-linkedin" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-linkedin"></use></svg><span class="screen-reader-text">DagsHub on LinkedIn</span></a> </li> <li class="social-list__item"> <a href="https://youtube.com/c/dagshub" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-youtube" width="18" height="18" aria-hidden="true"><use 
xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-youtube"></use></svg><span class="screen-reader-text">DagsHub on YouTube</span></a> </li> <li class="social-list__item"> <a href="https://discord.com/invite/9gU36Y6" target="_blank" rel="noopener" class="social-list__link"><svg class="svg-icon icon-discord" width="18" height="18" aria-hidden="true"><use xlink:href="https://dagshub.com/wp-content/themes/wp-d-theme/images/icons.svg?ver=1724154108#icon-discord"></use></svg><span class="screen-reader-text">DagsHub on Discord</span></a> </li> </ul> </div> <img src="https://dagshub.com/wp-content/uploads/2024/04/image-54.png" alt="" class="bottom_logo"/> </div> <div class="site-footer__frame"> <div class="site-footer__holder"> <div class="site-footer__nav"> <ul id="menu-pro-footer-menu" class="footer-nav"><li id="menu-item-14" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-14"><a>Resources</a> <ul class="sub-menu"> <li id="menu-item-15" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-15"><a href="https://dagshub.com/docs">Docs</a></li> <li id="menu-item-16" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-16"><a href="https://dagshub.com/blog">Blog</a></li> <li id="menu-item-101" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-101"><a href="/datasets/">Datasets</a></li> <li id="menu-item-1586" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-1586"><a href="/glossary/">Glossary</a></li> <li id="menu-item-2247" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2247"><a href="https://dagshub.com/blog/tag/case-study/">Case Studies</a></li> <li id="menu-item-2244" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2244"><a href="https://dagshub.com/blog/tag/tutorials/">Tutorials & Webinars</a></li> </ul> </li> <li id="menu-item-1708" class="menu-item menu-item-type-custom menu-item-object-custom 
menu-item-has-children menu-item-1708"><a>Product</a> <ul class="sub-menu"> <li id="menu-item-2076" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2076"><a href="https://dagshub.com/data-engine/">Data Engine</a></li> <li id="menu-item-2250" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2250"><a href="https://dagshub.com/use-cases/llm/">LLMs</a></li> <li id="menu-item-1463" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-1463"><a href="https://dagshub.com/product/">Platform</a></li> <li id="menu-item-1711" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-1711"><a href="https://dagshub.com/enterprise/">Enterprise</a></li> <li id="menu-item-2464" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2464"><a href="https://dagshub.com/pricing">Pricing</a></li> </ul> </li> <li id="menu-item-2347" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-2347"><a>Company</a> <ul class="sub-menu"> <li id="menu-item-2348" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2348"><a href="https://dagshub.com/about">About</a></li> <li id="menu-item-2349" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-2349"><a href="https://dagshub.com/careers">Careers</a></li> <li id="menu-item-2350" class="menu-item menu-item-type-post_type menu-item-object-page menu-item-2350"><a href="https://dagshub.com/contact-us/">Contact us</a></li> </ul> </li> <li id="menu-item-18" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-has-children menu-item-18"><a>Community</a> <ul class="sub-menu"> <li id="menu-item-17" class="menu-item menu-item-type-custom menu-item-object-custom menu-item-17"><a href="https://dagshub.com/explore/repos">Explore</a></li> </ul> </li> </ul> </div> <div class="site-footer__info"> </div> </div> </div> <div class="footer_subcscription"> <div 
class="wpcf7 no-js" id="wpcf7-f2374-p1256-o1" lang="en-US" dir="ltr"> <div class="screen-reader-response"><p role="status" aria-live="polite" aria-atomic="true"></p> <ul></ul></div> <form action="/datasets/japanese-tokenizer-dictionaries/#wpcf7-f2374-p1256-o1" method="post" class="wpcf7-form init" aria-label="Contact form" novalidate="novalidate" data-status="init"> <div style="display: none;"> <input type="hidden" name="_wpcf7" value="2374" /> <input type="hidden" name="_wpcf7_version" value="5.9.8" /> <input type="hidden" name="_wpcf7_locale" value="en_US" /> <input type="hidden" name="_wpcf7_unit_tag" value="wpcf7-f2374-p1256-o1" /> <input type="hidden" name="_wpcf7_container_post" value="1256" /> <input type="hidden" name="_wpcf7_posted_data_hash" value="" /> <input type="hidden" name="_wpcf7_recaptcha_response" value="" /> </div> <div class="footer-subcription-box"> <h3 class="title">ML Newsletter</h3> <p class="description">Top MLOps articles, case studies, events (and more) in your inbox every month</p> <div class="form-wrap c-form-subscription"> <!-- Newsletter sign-up: the email field has no visible label, so aria-label supplies its accessible name (a placeholder alone is not a label). --> <div class="c-form-primary__field"><span class="wpcf7-form-control-wrap" data-name="your-email"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-email wpcf7-validates-as-required wpcf7-text wpcf7-validates-as-email" autocomplete="email" aria-label="Email address" aria-required="true" aria-invalid="false" placeholder="Email" value="" type="email" name="your-email" /></span></div> <input class="wpcf7-form-control wpcf7-submit has-spinner" type="submit" value="Subscribe" /> </div> <div id="customMessage" style="display: none;"> You're subscribed! Check your inbox for exciting updates! 
</div> </div><div class="wpcf7-response-output" aria-hidden="true"></div> </form> </div> </div> </div> <div class="site-footer__row"> <div class="site-footer__copy">©2024 © Copyright Dagshub 2023</div> </div> </div> <div class="elipse-background"></div> <div class="elipse-background right"></div> </div> </div> <div class="modal fade c-modal c-modal-default cf7-form-modal show" tabindex="-1" id="modal-1687"> <div class="modal-dialog"> <div class="modal-content"> <div class="modal-header"> Contact us </div> <div class="modal-body"> <div class="wpcf7 no-js" id="wpcf7-f1687-p1256-o2" lang="en-US" dir="ltr"> <div class="screen-reader-response"><p role="status" aria-live="polite" aria-atomic="true"></p> <ul></ul></div> <form action="/datasets/japanese-tokenizer-dictionaries/#wpcf7-f1687-p1256-o2" method="post" class="wpcf7-form init" aria-label="Contact form" novalidate="novalidate" data-status="init"> <div style="display: none;"> <input type="hidden" name="_wpcf7" value="1687" /> <input type="hidden" name="_wpcf7_version" value="5.9.8" /> <input type="hidden" name="_wpcf7_locale" value="en_US" /> <input type="hidden" name="_wpcf7_unit_tag" value="wpcf7-f1687-p1256-o2" /> <input type="hidden" name="_wpcf7_container_post" value="1256" /> <input type="hidden" name="_wpcf7_posted_data_hash" value="" /> <input type="hidden" name="_wpcf7_recaptcha_response" value="" /> </div> <!-- Demo-request fields: a label's "for" value must equal the "id" of its input, otherwise the label is not associated with the control. --> <div class="c-form-primary"> <div class="c-form-primary__row"> <div class="c-form-primary__field"> <label for="first-name" class="c-form-primary__label">First Name</label> <div class="c-form-primary__field-element"> <span class="wpcf7-form-control-wrap" data-name="first-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" aria-required="true" aria-invalid="false" placeholder="Enter your first name here" value="" type="text" id="first-name" name="first-name" /></span> </div> </div> </div> <div class="c-form-primary__row"> <div class="c-form-primary__field"> 
<!-- Each label's "for" value matches the "id" added to its input so the pair is programmatically associated. --> <label for="last-name" class="c-form-primary__label">Last Name</label> <div class="c-form-primary__field-element"> <span class="wpcf7-form-control-wrap" data-name="last-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" aria-required="true" aria-invalid="false" placeholder="Enter your last name here" value="" type="text" id="last-name" name="last-name" /></span> </div> </div> </div> <div class="c-form-primary__row"> <div class="c-form-primary__field"> <label for="clients-email" class="c-form-primary__label">Work email</label> <div class="c-form-primary__field-element"> <span class="wpcf7-form-control-wrap" data-name="clients-email"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-email wpcf7-validates-as-required wpcf7-text wpcf7-validates-as-email required" aria-required="true" aria-invalid="false" placeholder="Enter your work email here" value="" type="email" id="clients-email" name="clients-email" /></span> </div> </div> </div> <div class="c-form-primary__row"> <div class="c-form-primary__field"> <label for="company-name" class="c-form-primary__label">Company name</label> <div class="c-form-primary__field-element"> <span class="wpcf7-form-control-wrap" data-name="company-name"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" aria-required="true" aria-invalid="false" placeholder="Enter your company name here" value="" type="text" id="company-name" name="company-name" /></span> </div> </div> </div> <div class="c-form-primary__row"> <div class="c-form-primary__field"> <label for="job-title" class="c-form-primary__label">Job title</label> <div class="c-form-primary__field-element"> <span class="wpcf7-form-control-wrap" data-name="job-title"><input size="40" maxlength="400" class="wpcf7-form-control wpcf7-text wpcf7-validates-as-required required" aria-required="true" aria-invalid="false" placeholder="Enter your job title here" value="" type="text" id="job-title" name="job-title" /></span> </div> 
</div> </div> <div class="c-form-primary__actions"> <input class="wpcf7-form-control wpcf7-submit has-spinner" type="submit" value="Request a demo" /> </div> </div><div class="wpcf7-response-output" aria-hidden="true"></div> </form> </div> </div> </div> </div> </div> <script src="https://dagshub.com/wp-includes/js/dist/hooks.min.js?ver=2810c76e705dd1a53b18" id="wp-hooks-js"></script> <script src="https://dagshub.com/wp-includes/js/dist/i18n.min.js?ver=5e580eb46a90c2b997e6" id="wp-i18n-js"></script> <script id="wp-i18n-js-after"> wp.i18n.setLocaleData( { 'text direction\u0004ltr': [ 'ltr' ] } ); </script> <script src="https://dagshub.com/wp-content/plugins/contact-form-7/includes/swv/js/index.js?ver=5.9.8" id="swv-js"></script> <script id="contact-form-7-js-extra"> var wpcf7 = {"api":{"root":"https:\/\/dagshub.com\/wp-json\/","namespace":"contact-form-7\/v1"},"cached":"1"}; </script> <script src="https://dagshub.com/wp-content/plugins/contact-form-7/includes/js/index.js?ver=5.9.8" id="contact-form-7-js"></script> <script src="https://dagshub.com/wp-includes/js/jquery/jquery.min.js?ver=3.7.1" id="jquery-core-js"></script> <script src="https://dagshub.com/wp-includes/js/jquery/jquery-migrate.min.js?ver=3.4.1" id="jquery-migrate-js"></script> <script src="https://dagshub.com/wp-content/themes/wp-d-theme/vendors/fancybox/fancybox.min.js?ver=4.0.31" id="fancybox-new-js-js"></script> <script src="https://dagshub.com/wp-content/themes/wp-d-theme/vendors/jquery.main.js?ver=1724154105" id="custom-js"></script> <script id="scripts-js-extra"> var air_light_screenReaderText = {"expand":"Open child menu","collapse":"Close child menu","expand_for":"Open child menu for","collapse_for":"Close child menu for","expand_toggle":"Open main menu","collapse_toggle":"Close main menu","external_link":"External site","target_blank":"opens in a new window","previous_slide":"Previous slide","next_slide":"Next slide","last_slide":"Last slide","skip_slider":"Skip over the carousel element"}; var 
air_light_externalLinkDomains = ["localhost:3000","airdev.test","airwptheme.com","localhost"]; </script> <script src="https://dagshub.com/wp-content/themes/wp-d-theme/js/prod/front-end.js?ver=1724154107" id="scripts-js"></script> <script src="https://dagshub.com/wp-includes/js/comment-reply.min.js?ver=4e55ae54fa701286f578c2d0b9d76284" id="comment-reply-js" async data-wp-strategy="async"></script> <script src="https://www.google.com/recaptcha/api.js?render=6LfHrukpAAAAAA9UYBYO1jTWc1qASGHFOc5xtGfG&ver=3.0" id="google-recaptcha-js"></script> <script src="https://dagshub.com/wp-includes/js/dist/vendor/wp-polyfill.min.js?ver=3.15.0" id="wp-polyfill-js"></script> <script id="wpcf7-recaptcha-js-extra"> var wpcf7_recaptcha = {"sitekey":"6LfHrukpAAAAAA9UYBYO1jTWc1qASGHFOc5xtGfG","actions":{"homepage":"homepage","contactform":"contactform"}}; </script> <script src="https://dagshub.com/wp-content/plugins/contact-form-7/modules/recaptcha/index.js?ver=5.9.8" id="wpcf7-recaptcha-js"></script> <a href="#page" id="top" class="top no-external-link-indicator" data-version="9.2.2"> <span class="screen-reader-text">Back to top</span> <span aria-hidden="true"><svg width="6" height="4" viewBox="0 0 6 4" fill="none" xmlns="http://www.w3.org/2000/svg"> <path d="M3 0.000342107L6 3.00034L5.4625 3.53784L3 1.06284L0.537501 3.52534L5.2492e-07 2.98784L3 0.000342107Z" fill="currentColor" /> </svg> </span> </a> </body> </html>