<!-- CINXE.COM -->

<!-- Text mining - Wikipedia -->

<!DOCTYPE html>
<html class="client-nojs vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available" lang="en" dir="ltr">
<head>
  <meta charset="UTF-8">
  <title>Text mining - Wikipedia</title>
  <!--
    Inline bootstrap script. It does two things:
      1. Replaces the root element's class list with a "client-js" variant,
         applying any per-user overrides stored in the
         "enwikimwclientpreferences" cookie.
      2. Assigns the page globals RLCONF, RLSTATE and RLPAGEMODULES.
    NOTE(review): the consumer of those globals is not visible in this file;
    presumably the "startup" module requested from /w/load.php reads them.
    Every string literal must stay on a single line: a raw newline inside a
    quoted JavaScript string is a syntax error and disables the whole script.
  -->
  <script>
    (function () {
      // Default class list for a script-enabled client.
      var className = "client-js vector-feature-language-in-header-enabled vector-feature-language-in-main-page-header-disabled vector-feature-sticky-header-disabled vector-feature-page-tools-pinned-disabled vector-feature-toc-pinned-clientpref-1 vector-feature-main-menu-pinned-disabled vector-feature-limited-width-clientpref-1 vector-feature-limited-width-content-enabled vector-feature-custom-font-size-clientpref-1 vector-feature-appearance-pinned-clientpref-1 vector-feature-night-mode-enabled skin-theme-clientpref-day vector-toc-available";
      // The cookie value is a list of "<feature>-clientpref-<value>" entries joined by "%2C".
      var cookie = document.cookie.match(/(?:^|; )enwikimwclientpreferences=([^;]+)/);
      if (cookie) {
        cookie[1].split('%2C').forEach(function (pref) {
          // Reduce the entry to its feature name (drop the "-clientpref-<value>" suffix and any
          // character other than word characters and "-"), then swap the matching default
          // class for the stored entry while keeping the surrounding separators.
          className = className.replace(
            new RegExp('(^| )' + pref.replace(/-clientpref-\w+$|[^\w-]+/g, '') + '-clientpref-\\w+( |$)'),
            '$1' + pref + '$2'
          );
        });
      }
      document.documentElement.className = className;
    }());
    // Page configuration values.
    RLCONF={"wgBreakFrames":false,"wgSeparatorTransformTable":["",""],"wgDigitTransformTable":["",""],"wgDefaultDateFormat":"dmy", "wgMonthNames":["","January","February","March","April","May","June","July","August","September","October","November","December"],"wgRequestId":"ccf64fe3-6299-40ca-8c90-7369c4bc5c94","wgCanonicalNamespace":"","wgCanonicalSpecialPageName":false,"wgNamespaceNumber":0,"wgPageName":"Text_mining","wgTitle":"Text mining","wgCurRevisionId":1251100761,"wgRevisionId":1251100761,"wgArticleId":318439,"wgIsArticle":true,"wgIsRedirect":false,"wgAction":"view","wgUserName":null,"wgUserGroups":["*"],"wgCategories":["Webarchive template wayback links","CS1 Portuguese-language sources (pt)","Articles with short description","Short description matches Wikidata","All articles with unsourced statements","Articles with unsourced statements from October 2022","Text mining","Applied data mining","Computational linguistics","Natural language processing","Statistical natural language processing","Text"],"wgPageViewLanguage":"en","wgPageContentLanguage":"en","wgPageContentModel":"wikitext","wgRelevantPageName": "Text_mining","wgRelevantArticleId":318439,"wgIsProbablyEditable":true,"wgRelevantPageIsProbablyEditable":true,"wgRestrictionEdit":[],"wgRestrictionMove":[],"wgNoticeProject":"wikipedia","wgCiteReferencePreviewsActive":false,"wgFlaggedRevsParams":{"tags":{"status":{"levels":1}}},"wgMediaViewerOnClick":true,"wgMediaViewerEnabledByDefault":true,"wgPopupsFlags":0,"wgVisualEditor":{"pageLanguageCode":"en","pageLanguageDir":"ltr","pageVariantFallbacks":"en"},"wgMFDisplayWikibaseDescriptions":{"search":true,"watchlist":true,"tagline":false,"nearby":true},"wgWMESchemaEditAttemptStepOversample":false,"wgWMEPageLength":40000,"wgRelatedArticlesCompat":[],"wgCentralAuthMobileDomain":false,"wgEditSubmitButtonLabelPublish":true,"wgULSPosition":"interlanguage","wgULSisCompactLinksEnabled":false,"wgVector2022LanguageInHeader":true,"wgULSisLanguageSelectorEmpty":false,"wgWikibaseItemId":"Q676880","wgCheckUserClientHintsHeadersJsApi":["brands","architecture","bitness","fullVersionList","mobile","model","platform","platformVersion"],"GEHomepageSuggestedEditsEnableTopics":true,"wgGETopicsMatchModeEnabled":false,"wgGEStructuredTaskRejectionReasonTextInputEnabled":false,"wgGELevelingUpEnabledForUser":false};
    // Module name -> state string ("ready" or "loading").
    RLSTATE={"ext.globalCssJs.user.styles":"ready","site.styles":"ready","user.styles":"ready","ext.globalCssJs.user":"ready","user":"ready","user.options":"loading","ext.cite.styles":"ready","ext.tmh.player.styles":"ready","skins.vector.search.codex.styles":"ready","skins.vector.styles":"ready","skins.vector.icons":"ready","jquery.makeCollapsible.styles":"ready","ext.wikimediamessages.styles":"ready","ext.visualEditor.desktopArticleTarget.noscript":"ready","ext.uls.interlanguage":"ready","wikibase.client.init":"ready","ext.wikimediaBadges":"ready"};
    // List of module names for this page.
    RLPAGEMODULES=["ext.cite.ux-enhancements","mediawiki.page.media","ext.tmh.player","site","mediawiki.page.ready","jquery.makeCollapsible","mediawiki.toc","skins.vector.js","ext.centralNotice.geoIP","ext.centralNotice.startUp", "ext.gadget.ReferenceTooltips","ext.gadget.switcher","ext.urlShortener.toolbar","ext.centralauth.centralautologin","mmv.bootstrap","ext.popups","ext.visualEditor.desktopArticleTarget.init","ext.visualEditor.targetLoader","ext.echo.centralauth","ext.eventLogging","ext.wikimediaEvents","ext.navigationTiming","ext.uls.interface","ext.cx.eventlogging.campaigns","ext.cx.uls.quick.actions","wikibase.client.vector-2022","ext.checkUser.clientHints","ext.growthExperiments.SuggestedEditSession","wikibase.sidebar.tracking"];
  </script>
  <!--
    Appends a callback to the global RLQ array (created here if it does not
    exist yet). When invoked, the callback registers "user.options@12s5i"
    through mw.loader.impl with a body that sets the patrol/watch/csrf tokens.
    NOTE(review): whatever drains RLQ is not shown in this file.
  -->
  <script>(RLQ=window.RLQ||[]).push(function(){mw.loader.impl(function(){return["user.options@12s5i",function($,jQuery,require,module){mw.user.tokens.set({"patrolToken":"+\\","watchToken":"+\\","csrfToken":"+\\"}); }];});});</script>
  <link rel="stylesheet" 
href="/w/load.php?lang=en&amp;modules=ext.cite.styles%7Cext.tmh.player.styles%7Cext.uls.interlanguage%7Cext.visualEditor.desktopArticleTarget.noscript%7Cext.wikimediaBadges%7Cext.wikimediamessages.styles%7Cjquery.makeCollapsible.styles%7Cskins.vector.icons%2Cstyles%7Cskins.vector.search.codex.styles%7Cwikibase.client.init&amp;only=styles&amp;skin=vector-2022"> <script async="" src="/w/load.php?lang=en&amp;modules=startup&amp;only=scripts&amp;raw=1&amp;skin=vector-2022"></script> <meta name="ResourceLoaderDynamicStyles" content=""> <link rel="stylesheet" href="/w/load.php?lang=en&amp;modules=site.styles&amp;only=styles&amp;skin=vector-2022"> <meta name="generator" content="MediaWiki 1.44.0-wmf.4"> <meta name="referrer" content="origin"> <meta name="referrer" content="origin-when-cross-origin"> <meta name="robots" content="max-image-preview:standard"> <meta name="format-detection" content="telephone=no"> <meta name="viewport" content="width=1120"> <meta property="og:title" content="Text mining - Wikipedia"> <meta property="og:type" content="website"> <link rel="preconnect" href="//upload.wikimedia.org"> <link rel="alternate" media="only screen and (max-width: 640px)" href="//en.m.wikipedia.org/wiki/Text_mining"> <link rel="alternate" type="application/x-wiki" title="Edit this page" href="/w/index.php?title=Text_mining&amp;action=edit"> <link rel="apple-touch-icon" href="/static/apple-touch/wikipedia.png"> <link rel="icon" href="/static/favicon/wikipedia.ico"> <link rel="search" type="application/opensearchdescription+xml" href="/w/rest.php/v1/search" title="Wikipedia (en)"> <link rel="EditURI" type="application/rsd+xml" href="//en.wikipedia.org/w/api.php?action=rsd"> <link rel="canonical" href="https://en.wikipedia.org/wiki/Text_mining"> <link rel="license" href="https://creativecommons.org/licenses/by-sa/4.0/deed.en"> <link rel="alternate" type="application/atom+xml" title="Wikipedia Atom feed" href="/w/index.php?title=Special:RecentChanges&amp;feed=atom"> <link 
rel="dns-prefetch" href="//meta.wikimedia.org" /> <link rel="dns-prefetch" href="//login.wikimedia.org"> </head> <body class="skin--responsive skin-vector skin-vector-search-vue mediawiki ltr sitedir-ltr mw-hide-empty-elt ns-0 ns-subject mw-editable page-Text_mining rootpage-Text_mining skin-vector-2022 action-view"><a class="mw-jump-link" href="#bodyContent">Jump to content</a> <div class="vector-header-container"> <header class="vector-header mw-header"> <div class="vector-header-start"> <nav class="vector-main-menu-landmark" aria-label="Site"> <div id="vector-main-menu-dropdown" class="vector-dropdown vector-main-menu-dropdown vector-button-flush-left vector-button-flush-right" > <input type="checkbox" id="vector-main-menu-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-main-menu-dropdown" class="vector-dropdown-checkbox " aria-label="Main menu" > <label id="vector-main-menu-dropdown-label" for="vector-main-menu-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-menu mw-ui-icon-wikimedia-menu"></span> <span class="vector-dropdown-label-text">Main menu</span> </label> <div class="vector-dropdown-content"> <div id="vector-main-menu-unpinned-container" class="vector-unpinned-container"> <div id="vector-main-menu" class="vector-main-menu vector-pinnable-element"> <div class="vector-pinnable-header vector-main-menu-pinnable-header vector-pinnable-header-unpinned" data-feature-name="main-menu-pinned" data-pinnable-element-id="vector-main-menu" data-pinned-container-id="vector-main-menu-pinned-container" data-unpinned-container-id="vector-main-menu-unpinned-container" > <div class="vector-pinnable-header-label">Main menu</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" 
data-event-name="pinnable-header.vector-main-menu.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-main-menu.unpin">hide</button> </div> <div id="p-navigation" class="vector-menu mw-portlet mw-portlet-navigation" > <div class="vector-menu-heading"> Navigation </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="n-mainpage-description" class="mw-list-item"><a href="/wiki/Main_Page" title="Visit the main page [z]" accesskey="z"><span>Main page</span></a></li><li id="n-contents" class="mw-list-item"><a href="/wiki/Wikipedia:Contents" title="Guides to browsing Wikipedia"><span>Contents</span></a></li><li id="n-currentevents" class="mw-list-item"><a href="/wiki/Portal:Current_events" title="Articles related to current events"><span>Current events</span></a></li><li id="n-randompage" class="mw-list-item"><a href="/wiki/Special:Random" title="Visit a randomly selected article [x]" accesskey="x"><span>Random article</span></a></li><li id="n-aboutsite" class="mw-list-item"><a href="/wiki/Wikipedia:About" title="Learn about Wikipedia and how it works"><span>About Wikipedia</span></a></li><li id="n-contactpage" class="mw-list-item"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us" title="How to contact Wikipedia"><span>Contact us</span></a></li> </ul> </div> </div> <div id="p-interaction" class="vector-menu mw-portlet mw-portlet-interaction" > <div class="vector-menu-heading"> Contribute </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="n-help" class="mw-list-item"><a href="/wiki/Help:Contents" title="Guidance on how to use and edit Wikipedia"><span>Help</span></a></li><li id="n-introduction" class="mw-list-item"><a href="/wiki/Help:Introduction" title="Learn how to edit Wikipedia"><span>Learn to edit</span></a></li><li id="n-portal" class="mw-list-item"><a 
href="/wiki/Wikipedia:Community_portal" title="The hub for editors"><span>Community portal</span></a></li><li id="n-recentchanges" class="mw-list-item"><a href="/wiki/Special:RecentChanges" title="A list of recent changes to Wikipedia [r]" accesskey="r"><span>Recent changes</span></a></li><li id="n-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_upload_wizard" title="Add images or other media for use on Wikipedia"><span>Upload file</span></a></li> </ul> </div> </div> </div> </div> </div> </div> </nav> <a href="/wiki/Main_Page" class="mw-logo"> <img class="mw-logo-icon" src="/static/images/icons/wikipedia.png" alt="" aria-hidden="true" height="50" width="50"> <span class="mw-logo-container skin-invert"> <img class="mw-logo-wordmark" alt="Wikipedia" src="/static/images/mobile/copyright/wikipedia-wordmark-en.svg" style="width: 7.5em; height: 1.125em;"> <img class="mw-logo-tagline" alt="The Free Encyclopedia" src="/static/images/mobile/copyright/wikipedia-tagline-en.svg" width="117" height="13" style="width: 7.3125em; height: 0.8125em;"> </span> </a> </div> <div class="vector-header-end"> <div id="p-search" role="search" class="vector-search-box-vue vector-search-box-collapses vector-search-box-show-thumbnail vector-search-box-auto-expand-width vector-search-box"> <a href="/wiki/Special:Search" class="cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only search-toggle" title="Search Wikipedia [f]" accesskey="f"><span class="vector-icon mw-ui-icon-search mw-ui-icon-wikimedia-search"></span> <span>Search</span> </a> <div class="vector-typeahead-search-container"> <div class="cdx-typeahead-search cdx-typeahead-search--show-thumbnail cdx-typeahead-search--auto-expand-width"> <form action="/w/index.php" id="searchform" class="cdx-search-input cdx-search-input--has-end-button"> <div id="simpleSearch" class="cdx-search-input__input-wrapper" data-search-loc="header-moved"> <div class="cdx-text-input 
cdx-text-input--has-start-icon"> <input class="cdx-text-input__input" type="search" name="search" placeholder="Search Wikipedia" aria-label="Search Wikipedia" autocapitalize="sentences" title="Search Wikipedia [f]" accesskey="f" id="searchInput" > <span class="cdx-text-input__icon cdx-text-input__start-icon"></span> </div> <input type="hidden" name="title" value="Special:Search"> </div> <button class="cdx-button cdx-search-input__end-button">Search</button> </form> </div> </div> </div> <nav class="vector-user-links vector-user-links-wide" aria-label="Personal tools"> <div class="vector-user-links-main"> <div id="p-vector-user-menu-preferences" class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <div id="p-vector-user-menu-userpage" class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <nav class="vector-appearance-landmark" aria-label="Appearance"> <div id="vector-appearance-dropdown" class="vector-dropdown " title="Change the appearance of the page&#039;s font size, width, and color" > <input type="checkbox" id="vector-appearance-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-appearance-dropdown" class="vector-dropdown-checkbox " aria-label="Appearance" > <label id="vector-appearance-dropdown-label" for="vector-appearance-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-appearance mw-ui-icon-wikimedia-appearance"></span> <span class="vector-dropdown-label-text">Appearance</span> </label> <div class="vector-dropdown-content"> <div id="vector-appearance-unpinned-container" class="vector-unpinned-container"> </div> </div> </div> </nav> <div id="p-vector-user-menu-notifications" 
class="vector-menu mw-portlet emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> <div id="p-vector-user-menu-overflow" class="vector-menu mw-portlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-sitesupport-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&amp;utm_medium=sidebar&amp;utm_campaign=C13_en.wikipedia.org&amp;uselang=en" class=""><span>Donate</span></a> </li> <li id="pt-createaccount-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:CreateAccount&amp;returnto=Text+mining" title="You are encouraged to create an account and log in; however, it is not mandatory" class=""><span>Create account</span></a> </li> <li id="pt-login-2" class="user-links-collapsible-item mw-list-item user-links-collapsible-item"><a data-mw="interface" href="/w/index.php?title=Special:UserLogin&amp;returnto=Text+mining" title="You&#039;re encouraged to log in; however, it&#039;s not mandatory. 
[o]" accesskey="o" class=""><span>Log in</span></a> </li> </ul> </div> </div> </div> <div id="vector-user-links-dropdown" class="vector-dropdown vector-user-menu vector-button-flush-right vector-user-menu-logged-out" title="Log in and more options" > <input type="checkbox" id="vector-user-links-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-user-links-dropdown" class="vector-dropdown-checkbox " aria-label="Personal tools" > <label id="vector-user-links-dropdown-label" for="vector-user-links-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-ellipsis mw-ui-icon-wikimedia-ellipsis"></span> <span class="vector-dropdown-label-text">Personal tools</span> </label> <div class="vector-dropdown-content"> <div id="p-personal" class="vector-menu mw-portlet mw-portlet-personal user-links-collapsible-item" title="User menu" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-sitesupport" class="user-links-collapsible-item mw-list-item"><a href="https://donate.wikimedia.org/wiki/Special:FundraiserRedirector?utm_source=donate&amp;utm_medium=sidebar&amp;utm_campaign=C13_en.wikipedia.org&amp;uselang=en"><span>Donate</span></a></li><li id="pt-createaccount" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:CreateAccount&amp;returnto=Text+mining" title="You are encouraged to create an account and log in; however, it is not mandatory"><span class="vector-icon mw-ui-icon-userAdd mw-ui-icon-wikimedia-userAdd"></span> <span>Create account</span></a></li><li id="pt-login" class="user-links-collapsible-item mw-list-item"><a href="/w/index.php?title=Special:UserLogin&amp;returnto=Text+mining" title="You&#039;re encouraged to log in; however, it&#039;s not mandatory. 
[o]" accesskey="o"><span class="vector-icon mw-ui-icon-logIn mw-ui-icon-wikimedia-logIn"></span> <span>Log in</span></a></li> </ul> </div> </div> <div id="p-user-menu-anon-editor" class="vector-menu mw-portlet mw-portlet-user-menu-anon-editor" > <div class="vector-menu-heading"> Pages for logged out editors <a href="/wiki/Help:Introduction" aria-label="Learn more about editing"><span>learn more</span></a> </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="pt-anoncontribs" class="mw-list-item"><a href="/wiki/Special:MyContributions" title="A list of edits made from this IP address [y]" accesskey="y"><span>Contributions</span></a></li><li id="pt-anontalk" class="mw-list-item"><a href="/wiki/Special:MyTalk" title="Discussion about edits from this IP address [n]" accesskey="n"><span>Talk</span></a></li> </ul> </div> </div> </div> </div> </nav> </div> </header> </div> <div class="mw-page-container"> <div class="mw-page-container-inner"> <div class="vector-sitenotice-container"> <div id="siteNotice"><!-- CentralNotice --></div> </div> <div class="vector-column-start"> <div class="vector-main-menu-container"> <div id="mw-navigation"> <nav id="mw-panel" class="vector-main-menu-landmark" aria-label="Site"> <div id="vector-main-menu-pinned-container" class="vector-pinned-container"> </div> </nav> </div> </div> <div class="vector-sticky-pinned-container"> <nav id="mw-panel-toc" aria-label="Contents" data-event-name="ui.sidebar-toc" class="mw-table-of-contents-container vector-toc-landmark"> <div id="vector-toc-pinned-container" class="vector-pinned-container"> <div id="vector-toc" class="vector-toc vector-pinnable-element"> <div class="vector-pinnable-header vector-toc-pinnable-header vector-pinnable-header-pinned" data-feature-name="toc-pinned" data-pinnable-element-id="vector-toc" > <h2 class="vector-pinnable-header-label">Contents</h2> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" 
data-event-name="pinnable-header.vector-toc.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-toc.unpin">hide</button> </div> <ul class="vector-toc-contents" id="mw-panel-toc-list"> <li id="toc-mw-content-text" class="vector-toc-list-item vector-toc-level-1"> <a href="#" class="vector-toc-link"> <div class="vector-toc-text">(Top)</div> </a> </li> <li id="toc-Text_analytics" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Text_analytics"> <div class="vector-toc-text"> <span class="vector-toc-numb">1</span> <span>Text analytics</span> </div> </a> <ul id="toc-Text_analytics-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Text_analysis_processes" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Text_analysis_processes"> <div class="vector-toc-text"> <span class="vector-toc-numb">2</span> <span>Text analysis processes</span> </div> </a> <ul id="toc-Text_analysis_processes-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Applications" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3</span> <span>Applications</span> </div> </a> <button aria-controls="toc-Applications-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle Applications subsection</span> </button> <ul id="toc-Applications-sublist" class="vector-toc-list"> <li id="toc-Security_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Security_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.1</span> <span>Security applications</span> </div> 
</a> <ul id="toc-Security_applications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Biomedical_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Biomedical_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.2</span> <span>Biomedical applications</span> </div> </a> <ul id="toc-Biomedical_applications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Software_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Software_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.3</span> <span>Software applications</span> </div> </a> <ul id="toc-Software_applications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Online_media_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Online_media_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.4</span> <span>Online media applications</span> </div> </a> <ul id="toc-Online_media_applications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Business_and_marketing_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Business_and_marketing_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.5</span> <span>Business and marketing applications</span> </div> </a> <ul id="toc-Business_and_marketing_applications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Sentiment_analysis" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Sentiment_analysis"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.6</span> <span>Sentiment analysis</span> </div> </a> <ul id="toc-Sentiment_analysis-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Scientific_literature_mining_and_academic_applications" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" 
href="#Scientific_literature_mining_and_academic_applications"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.7</span> <span>Scientific literature mining and academic applications</span> </div> </a> <ul id="toc-Scientific_literature_mining_and_academic_applications-sublist" class="vector-toc-list"> <li id="toc-Methods_for_scientific_literature_mining" class="vector-toc-list-item vector-toc-level-3"> <a class="vector-toc-link" href="#Methods_for_scientific_literature_mining"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.7.1</span> <span>Methods for scientific literature mining</span> </div> </a> <ul id="toc-Methods_for_scientific_literature_mining-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Digital_humanities_and_computational_sociology" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Digital_humanities_and_computational_sociology"> <div class="vector-toc-text"> <span class="vector-toc-numb">3.8</span> <span>Digital humanities and computational sociology</span> </div> </a> <ul id="toc-Digital_humanities_and_computational_sociology-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Software" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Software"> <div class="vector-toc-text"> <span class="vector-toc-numb">4</span> <span>Software</span> </div> </a> <ul id="toc-Software-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Intellectual_property_law" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Intellectual_property_law"> <div class="vector-toc-text"> <span class="vector-toc-numb">5</span> <span>Intellectual property law</span> </div> </a> <button aria-controls="toc-Intellectual_property_law-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon 
mw-ui-icon-wikimedia-expand"></span> <span>Toggle Intellectual property law subsection</span> </button> <ul id="toc-Intellectual_property_law-sublist" class="vector-toc-list"> <li id="toc-Situation_in_Europe" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Situation_in_Europe"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.1</span> <span>Situation in Europe</span> </div> </a> <ul id="toc-Situation_in_Europe-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Situation_in_the_United_States" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Situation_in_the_United_States"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.2</span> <span>Situation in the United States</span> </div> </a> <ul id="toc-Situation_in_the_United_States-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Situation_in_Australia" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Situation_in_Australia"> <div class="vector-toc-text"> <span class="vector-toc-numb">5.3</span> <span>Situation in Australia</span> </div> </a> <ul id="toc-Situation_in_Australia-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-Implications" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#Implications"> <div class="vector-toc-text"> <span class="vector-toc-numb">6</span> <span>Implications</span> </div> </a> <ul id="toc-Implications-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-See_also" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#See_also"> <div class="vector-toc-text"> <span class="vector-toc-numb">7</span> <span>See also</span> </div> </a> <ul id="toc-See_also-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-References" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a 
class="vector-toc-link" href="#References"> <div class="vector-toc-text"> <span class="vector-toc-numb">8</span> <span>References</span> </div> </a> <button aria-controls="toc-References-sublist" class="cdx-button cdx-button--weight-quiet cdx-button--icon-only vector-toc-toggle"> <span class="vector-icon mw-ui-icon-wikimedia-expand"></span> <span>Toggle References subsection</span> </button> <ul id="toc-References-sublist" class="vector-toc-list"> <li id="toc-Citations" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Citations"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.1</span> <span>Citations</span> </div> </a> <ul id="toc-Citations-sublist" class="vector-toc-list"> </ul> </li> <li id="toc-Sources" class="vector-toc-list-item vector-toc-level-2"> <a class="vector-toc-link" href="#Sources"> <div class="vector-toc-text"> <span class="vector-toc-numb">8.2</span> <span>Sources</span> </div> </a> <ul id="toc-Sources-sublist" class="vector-toc-list"> </ul> </li> </ul> </li> <li id="toc-External_links" class="vector-toc-list-item vector-toc-level-1 vector-toc-list-item-expanded"> <a class="vector-toc-link" href="#External_links"> <div class="vector-toc-text"> <span class="vector-toc-numb">9</span> <span>External links</span> </div> </a> <ul id="toc-External_links-sublist" class="vector-toc-list"> </ul> </li> </ul> </div> </div> </nav> </div> </div> <div class="mw-content-container"> <main id="content" class="mw-body"> <header class="mw-body-header vector-page-titlebar"> <nav aria-label="Contents" class="vector-toc-landmark"> <div id="vector-page-titlebar-toc" class="vector-dropdown vector-page-titlebar-toc vector-button-flush-left" > <input type="checkbox" id="vector-page-titlebar-toc-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-titlebar-toc" class="vector-dropdown-checkbox " aria-label="Toggle the table of contents" > <label id="vector-page-titlebar-toc-label" 
for="vector-page-titlebar-toc-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--icon-only " aria-hidden="true" ><span class="vector-icon mw-ui-icon-listBullet mw-ui-icon-wikimedia-listBullet"></span> <span class="vector-dropdown-label-text">Toggle the table of contents</span> </label> <div class="vector-dropdown-content"> <div id="vector-page-titlebar-toc-unpinned-container" class="vector-unpinned-container"> </div> </div> </div> </nav> <h1 id="firstHeading" class="firstHeading mw-first-heading"><span class="mw-page-title-main">Text mining</span></h1> <div id="p-lang-btn" class="vector-dropdown mw-portlet mw-portlet-lang" > <input type="checkbox" id="p-lang-btn-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-p-lang-btn" class="vector-dropdown-checkbox mw-interlanguage-selector" aria-label="Go to an article in another language. Available in 33 languages" > <label id="p-lang-btn-label" for="p-lang-btn-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet cdx-button--action-progressive mw-portlet-lang-heading-33" aria-hidden="true" ><span class="vector-icon mw-ui-icon-language-progressive mw-ui-icon-wikimedia-language-progressive"></span> <span class="vector-dropdown-label-text">33 languages</span> </label> <div class="vector-dropdown-content"> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li class="interlanguage-link interwiki-ar mw-list-item"><a href="https://ar.wikipedia.org/wiki/%D8%AA%D9%86%D9%82%D9%8A%D8%A8_%D9%81%D9%8A_%D8%A7%D9%84%D9%86%D8%B5%D9%88%D8%B5" title="تنقيب في النصوص – Arabic" lang="ar" hreflang="ar" data-title="تنقيب في النصوص" data-language-autonym="العربية" data-language-local-name="Arabic" class="interlanguage-link-target"><span>العربية</span></a></li><li class="interlanguage-link interwiki-bg mw-list-item"><a 
href="https://bg.wikipedia.org/wiki/%D0%98%D0%B7%D0%B2%D0%BB%D0%B8%D1%87%D0%B0%D0%BD%D0%B5_%D0%BD%D0%B0_%D0%B7%D0%BD%D0%B0%D0%BD%D0%B8%D1%8F_%D0%BE%D1%82_%D1%82%D0%B5%D0%BA%D1%81%D1%82" title="Извличане на знания от текст – Bulgarian" lang="bg" hreflang="bg" data-title="Извличане на знания от текст" data-language-autonym="Български" data-language-local-name="Bulgarian" class="interlanguage-link-target"><span>Български</span></a></li><li class="interlanguage-link interwiki-bs mw-list-item"><a href="https://bs.wikipedia.org/wiki/Rudarenje_tekstualnih_podataka" title="Rudarenje tekstualnih podataka – Bosnian" lang="bs" hreflang="bs" data-title="Rudarenje tekstualnih podataka" data-language-autonym="Bosanski" data-language-local-name="Bosnian" class="interlanguage-link-target"><span>Bosanski</span></a></li><li class="interlanguage-link interwiki-ca mw-list-item"><a href="https://ca.wikipedia.org/wiki/Mineria_de_textos" title="Mineria de textos – Catalan" lang="ca" hreflang="ca" data-title="Mineria de textos" data-language-autonym="Català" data-language-local-name="Catalan" class="interlanguage-link-target"><span>Català</span></a></li><li class="interlanguage-link interwiki-cs mw-list-item"><a href="https://cs.wikipedia.org/wiki/Dolov%C3%A1n%C3%AD_z_textu" title="Dolování z textu – Czech" lang="cs" hreflang="cs" data-title="Dolování z textu" data-language-autonym="Čeština" data-language-local-name="Czech" class="interlanguage-link-target"><span>Čeština</span></a></li><li class="interlanguage-link interwiki-de mw-list-item"><a href="https://de.wikipedia.org/wiki/Text_Mining" title="Text Mining – German" lang="de" hreflang="de" data-title="Text Mining" data-language-autonym="Deutsch" data-language-local-name="German" class="interlanguage-link-target"><span>Deutsch</span></a></li><li class="interlanguage-link interwiki-et mw-list-item"><a href="https://et.wikipedia.org/wiki/Tekstikaeve" title="Tekstikaeve – Estonian" lang="et" hreflang="et" data-title="Tekstikaeve" 
data-language-autonym="Eesti" data-language-local-name="Estonian" class="interlanguage-link-target"><span>Eesti</span></a></li><li class="interlanguage-link interwiki-el mw-list-item"><a href="https://el.wikipedia.org/wiki/%CE%95%CE%BE%CF%8C%CF%81%CF%85%CE%BE%CE%B7_%CE%BA%CE%B5%CE%B9%CE%BC%CE%AD%CE%BD%CE%BF%CF%85" title="Εξόρυξη κειμένου – Greek" lang="el" hreflang="el" data-title="Εξόρυξη κειμένου" data-language-autonym="Ελληνικά" data-language-local-name="Greek" class="interlanguage-link-target"><span>Ελληνικά</span></a></li><li class="interlanguage-link interwiki-es mw-list-item"><a href="https://es.wikipedia.org/wiki/Miner%C3%ADa_de_textos" title="Minería de textos – Spanish" lang="es" hreflang="es" data-title="Minería de textos" data-language-autonym="Español" data-language-local-name="Spanish" class="interlanguage-link-target"><span>Español</span></a></li><li class="interlanguage-link interwiki-eu mw-list-item"><a href="https://eu.wikipedia.org/wiki/Testu-meatzaritza" title="Testu-meatzaritza – Basque" lang="eu" hreflang="eu" data-title="Testu-meatzaritza" data-language-autonym="Euskara" data-language-local-name="Basque" class="interlanguage-link-target"><span>Euskara</span></a></li><li class="interlanguage-link interwiki-fa mw-list-item"><a href="https://fa.wikipedia.org/wiki/%D9%85%D8%AA%D9%86%E2%80%8C%DA%A9%D8%A7%D9%88%DB%8C" title="متن‌کاوی – Persian" lang="fa" hreflang="fa" data-title="متن‌کاوی" data-language-autonym="فارسی" data-language-local-name="Persian" class="interlanguage-link-target"><span>فارسی</span></a></li><li class="interlanguage-link interwiki-fr mw-list-item"><a href="https://fr.wikipedia.org/wiki/Fouille_de_textes" title="Fouille de textes – French" lang="fr" hreflang="fr" data-title="Fouille de textes" data-language-autonym="Français" data-language-local-name="French" class="interlanguage-link-target"><span>Français</span></a></li><li class="interlanguage-link interwiki-ko mw-list-item"><a 
href="https://ko.wikipedia.org/wiki/%ED%85%8D%EC%8A%A4%ED%8A%B8_%EB%A7%88%EC%9D%B4%EB%8B%9D" title="텍스트 마이닝 – Korean" lang="ko" hreflang="ko" data-title="텍스트 마이닝" data-language-autonym="한국어" data-language-local-name="Korean" class="interlanguage-link-target"><span>한국어</span></a></li><li class="interlanguage-link interwiki-id mw-list-item"><a href="https://id.wikipedia.org/wiki/Penambangan_teks" title="Penambangan teks – Indonesian" lang="id" hreflang="id" data-title="Penambangan teks" data-language-autonym="Bahasa Indonesia" data-language-local-name="Indonesian" class="interlanguage-link-target"><span>Bahasa Indonesia</span></a></li><li class="interlanguage-link interwiki-it mw-list-item"><a href="https://it.wikipedia.org/wiki/Text_mining" title="Text mining – Italian" lang="it" hreflang="it" data-title="Text mining" data-language-autonym="Italiano" data-language-local-name="Italian" class="interlanguage-link-target"><span>Italiano</span></a></li><li class="interlanguage-link interwiki-he mw-list-item"><a href="https://he.wikipedia.org/wiki/%D7%9B%D7%A8%D7%99%D7%99%D7%AA_%D7%98%D7%A7%D7%A1%D7%98" title="כריית טקסט – Hebrew" lang="he" hreflang="he" data-title="כריית טקסט" data-language-autonym="עברית" data-language-local-name="Hebrew" class="interlanguage-link-target"><span>עברית</span></a></li><li class="interlanguage-link interwiki-kn mw-list-item"><a href="https://kn.wikipedia.org/wiki/%E0%B2%AA%E0%B2%A0%E0%B3%8D%E0%B2%AF_%E0%B2%97%E0%B2%A3%E0%B2%BF%E0%B2%97%E0%B2%BE%E0%B2%B0%E0%B2%BF%E0%B2%95%E0%B3%86" title="ಪಠ್ಯ ಗಣಿಗಾರಿಕೆ – Kannada" lang="kn" hreflang="kn" data-title="ಪಠ್ಯ ಗಣಿಗಾರಿಕೆ" data-language-autonym="ಕನ್ನಡ" data-language-local-name="Kannada" class="interlanguage-link-target"><span>ಕನ್ನಡ</span></a></li><li class="interlanguage-link interwiki-hu mw-list-item"><a href="https://hu.wikipedia.org/wiki/Sz%C3%B6vegb%C3%A1ny%C3%A1szat" title="Szövegbányászat – Hungarian" lang="hu" hreflang="hu" data-title="Szövegbányászat" data-language-autonym="Magyar" 
data-language-local-name="Hungarian" class="interlanguage-link-target"><span>Magyar</span></a></li><li class="interlanguage-link interwiki-nl mw-list-item"><a href="https://nl.wikipedia.org/wiki/Textmining" title="Textmining – Dutch" lang="nl" hreflang="nl" data-title="Textmining" data-language-autonym="Nederlands" data-language-local-name="Dutch" class="interlanguage-link-target"><span>Nederlands</span></a></li><li class="interlanguage-link interwiki-ja mw-list-item"><a href="https://ja.wikipedia.org/wiki/%E3%83%86%E3%82%AD%E3%82%B9%E3%83%88%E3%83%9E%E3%82%A4%E3%83%8B%E3%83%B3%E3%82%B0" title="テキストマイニング – Japanese" lang="ja" hreflang="ja" data-title="テキストマイニング" data-language-autonym="日本語" data-language-local-name="Japanese" class="interlanguage-link-target"><span>日本語</span></a></li><li class="interlanguage-link interwiki-uz mw-list-item"><a href="https://uz.wikipedia.org/wiki/Intellektual_matn_tahlili" title="Intellektual matn tahlili – Uzbek" lang="uz" hreflang="uz" data-title="Intellektual matn tahlili" data-language-autonym="Oʻzbekcha / ўзбекча" data-language-local-name="Uzbek" class="interlanguage-link-target"><span>Oʻzbekcha / ўзбекча</span></a></li><li class="interlanguage-link interwiki-pl mw-list-item"><a href="https://pl.wikipedia.org/wiki/Text_mining" title="Text mining – Polish" lang="pl" hreflang="pl" data-title="Text mining" data-language-autonym="Polski" data-language-local-name="Polish" class="interlanguage-link-target"><span>Polski</span></a></li><li class="interlanguage-link interwiki-pt mw-list-item"><a href="https://pt.wikipedia.org/wiki/Minera%C3%A7%C3%A3o_de_texto" title="Mineração de texto – Portuguese" lang="pt" hreflang="pt" data-title="Mineração de texto" data-language-autonym="Português" data-language-local-name="Portuguese" class="interlanguage-link-target"><span>Português</span></a></li><li class="interlanguage-link interwiki-ru mw-list-item"><a 
href="https://ru.wikipedia.org/wiki/%D0%98%D0%BD%D1%82%D0%B5%D0%BB%D0%BB%D0%B5%D0%BA%D1%82%D1%83%D0%B0%D0%BB%D1%8C%D0%BD%D1%8B%D0%B9_%D0%B0%D0%BD%D0%B0%D0%BB%D0%B8%D0%B7_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D0%B0" title="Интеллектуальный анализ текста – Russian" lang="ru" hreflang="ru" data-title="Интеллектуальный анализ текста" data-language-autonym="Русский" data-language-local-name="Russian" class="interlanguage-link-target"><span>Русский</span></a></li><li class="interlanguage-link interwiki-sl mw-list-item"><a href="https://sl.wikipedia.org/wiki/Rudarjenje_besedil" title="Rudarjenje besedil – Slovenian" lang="sl" hreflang="sl" data-title="Rudarjenje besedil" data-language-autonym="Slovenščina" data-language-local-name="Slovenian" class="interlanguage-link-target"><span>Slovenščina</span></a></li><li class="interlanguage-link interwiki-fi mw-list-item"><a href="https://fi.wikipedia.org/wiki/Tekstinlouhinta" title="Tekstinlouhinta – Finnish" lang="fi" hreflang="fi" data-title="Tekstinlouhinta" data-language-autonym="Suomi" data-language-local-name="Finnish" class="interlanguage-link-target"><span>Suomi</span></a></li><li class="interlanguage-link interwiki-sv mw-list-item"><a href="https://sv.wikipedia.org/wiki/Text_mining" title="Text mining – Swedish" lang="sv" hreflang="sv" data-title="Text mining" data-language-autonym="Svenska" data-language-local-name="Swedish" class="interlanguage-link-target"><span>Svenska</span></a></li><li class="interlanguage-link interwiki-th mw-list-item"><a href="https://th.wikipedia.org/wiki/%E0%B8%81%E0%B8%B2%E0%B8%A3%E0%B8%97%E0%B8%B3%E0%B9%80%E0%B8%AB%E0%B8%A1%E0%B8%B7%E0%B8%AD%E0%B8%87%E0%B8%82%E0%B9%89%E0%B8%AD%E0%B8%84%E0%B8%A7%E0%B8%B2%E0%B8%A1" title="การทำเหมืองข้อความ – Thai" lang="th" hreflang="th" data-title="การทำเหมืองข้อความ" data-language-autonym="ไทย" data-language-local-name="Thai" class="interlanguage-link-target"><span>ไทย</span></a></li><li class="interlanguage-link interwiki-tr mw-list-item"><a 
href="https://tr.wikipedia.org/wiki/Metin_madencili%C4%9Fi" title="Metin madenciliği – Turkish" lang="tr" hreflang="tr" data-title="Metin madenciliği" data-language-autonym="Türkçe" data-language-local-name="Turkish" class="interlanguage-link-target"><span>Türkçe</span></a></li><li class="interlanguage-link interwiki-uk mw-list-item"><a href="https://uk.wikipedia.org/wiki/%D0%86%D0%BD%D1%82%D0%B5%D0%BB%D0%B5%D0%BA%D1%82%D1%83%D0%B0%D0%BB%D1%8C%D0%BD%D0%B8%D0%B9_%D0%B0%D0%BD%D0%B0%D0%BB%D1%96%D0%B7_%D1%82%D0%B5%D0%BA%D1%81%D1%82%D1%83" title="Інтелектуальний аналіз тексту – Ukrainian" lang="uk" hreflang="uk" data-title="Інтелектуальний аналіз тексту" data-language-autonym="Українська" data-language-local-name="Ukrainian" class="interlanguage-link-target"><span>Українська</span></a></li><li class="interlanguage-link interwiki-vi mw-list-item"><a href="https://vi.wikipedia.org/wiki/Khai_th%C3%A1c_v%C4%83n_b%E1%BA%A3n" title="Khai thác văn bản – Vietnamese" lang="vi" hreflang="vi" data-title="Khai thác văn bản" data-language-autonym="Tiếng Việt" data-language-local-name="Vietnamese" class="interlanguage-link-target"><span>Tiếng Việt</span></a></li><li class="interlanguage-link interwiki-zh-yue mw-list-item"><a href="https://zh-yue.wikipedia.org/wiki/%E6%96%87%E6%9C%AC%E6%8E%A2%E5%8B%98" title="文本探勘 – Cantonese" lang="yue" hreflang="yue" data-title="文本探勘" data-language-autonym="粵語" data-language-local-name="Cantonese" class="interlanguage-link-target"><span>粵語</span></a></li><li class="interlanguage-link interwiki-zh mw-list-item"><a href="https://zh.wikipedia.org/wiki/%E6%96%87%E6%9C%AC%E6%8C%96%E6%8E%98" title="文本挖掘 – Chinese" lang="zh" hreflang="zh" data-title="文本挖掘" data-language-autonym="中文" data-language-local-name="Chinese" class="interlanguage-link-target"><span>中文</span></a></li> </ul> <div class="after-portlet after-portlet-lang"><span class="wb-langlinks-edit wb-langlinks-link"><a 
href="https://www.wikidata.org/wiki/Special:EntityPage/Q676880#sitelinks-wikipedia" title="Edit interlanguage links" class="wbc-editpage">Edit links</a></span></div> </div> </div> </div> </header> <div class="vector-page-toolbar"> <div class="vector-page-toolbar-container"> <div id="left-navigation"> <nav aria-label="Namespaces"> <div id="p-associated-pages" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-associated-pages" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-nstab-main" class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Text_mining" title="View the content page [c]" accesskey="c"><span>Article</span></a></li><li id="ca-talk" class="vector-tab-noicon mw-list-item"><a href="/wiki/Talk:Text_mining" rel="discussion" title="Discuss improvements to the content page [t]" accesskey="t"><span>Talk</span></a></li> </ul> </div> </div> <div id="vector-variants-dropdown" class="vector-dropdown emptyPortlet" > <input type="checkbox" id="vector-variants-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-variants-dropdown" class="vector-dropdown-checkbox " aria-label="Change language variant" > <label id="vector-variants-dropdown-label" for="vector-variants-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true" ><span class="vector-dropdown-label-text">English</span> </label> <div class="vector-dropdown-content"> <div id="p-variants" class="vector-menu mw-portlet mw-portlet-variants emptyPortlet" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> </ul> </div> </div> </div> </div> </nav> </div> <div id="right-navigation" class="vector-collapsible"> <nav aria-label="Views"> <div id="p-views" class="vector-menu vector-menu-tabs mw-portlet mw-portlet-views" > <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-view" 
class="selected vector-tab-noicon mw-list-item"><a href="/wiki/Text_mining"><span>Read</span></a></li><li id="ca-edit" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Text_mining&amp;action=edit" title="Edit this page [e]" accesskey="e"><span>Edit</span></a></li><li id="ca-history" class="vector-tab-noicon mw-list-item"><a href="/w/index.php?title=Text_mining&amp;action=history" title="Past revisions of this page [h]" accesskey="h"><span>View history</span></a></li> </ul> </div> </div> </nav> <nav class="vector-page-tools-landmark" aria-label="Page tools"> <div id="vector-page-tools-dropdown" class="vector-dropdown vector-page-tools-dropdown" > <input type="checkbox" id="vector-page-tools-dropdown-checkbox" role="button" aria-haspopup="true" data-event-name="ui.dropdown-vector-page-tools-dropdown" class="vector-dropdown-checkbox " aria-label="Tools" > <label id="vector-page-tools-dropdown-label" for="vector-page-tools-dropdown-checkbox" class="vector-dropdown-label cdx-button cdx-button--fake-button cdx-button--fake-button--enabled cdx-button--weight-quiet" aria-hidden="true" ><span class="vector-dropdown-label-text">Tools</span> </label> <div class="vector-dropdown-content"> <div id="vector-page-tools-unpinned-container" class="vector-unpinned-container"> <div id="vector-page-tools" class="vector-page-tools vector-pinnable-element"> <div class="vector-pinnable-header vector-page-tools-pinnable-header vector-pinnable-header-unpinned" data-feature-name="page-tools-pinned" data-pinnable-element-id="vector-page-tools" data-pinned-container-id="vector-page-tools-pinned-container" data-unpinned-container-id="vector-page-tools-unpinned-container" > <div class="vector-pinnable-header-label">Tools</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-page-tools.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button 
vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-page-tools.unpin">hide</button> </div> <div id="p-cactions" class="vector-menu mw-portlet mw-portlet-cactions emptyPortlet vector-has-collapsible-items" title="More options" > <div class="vector-menu-heading"> Actions </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="ca-more-view" class="selected vector-more-collapsible-item mw-list-item"><a href="/wiki/Text_mining"><span>Read</span></a></li><li id="ca-more-edit" class="vector-more-collapsible-item mw-list-item"><a href="/w/index.php?title=Text_mining&amp;action=edit" title="Edit this page [e]" accesskey="e"><span>Edit</span></a></li><li id="ca-more-history" class="vector-more-collapsible-item mw-list-item"><a href="/w/index.php?title=Text_mining&amp;action=history"><span>View history</span></a></li> </ul> </div> </div> <div id="p-tb" class="vector-menu mw-portlet mw-portlet-tb" > <div class="vector-menu-heading"> General </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="t-whatlinkshere" class="mw-list-item"><a href="/wiki/Special:WhatLinksHere/Text_mining" title="List of all English Wikipedia pages containing links to this page [j]" accesskey="j"><span>What links here</span></a></li><li id="t-recentchangeslinked" class="mw-list-item"><a href="/wiki/Special:RecentChangesLinked/Text_mining" rel="nofollow" title="Recent changes in pages linked from this page [k]" accesskey="k"><span>Related changes</span></a></li><li id="t-upload" class="mw-list-item"><a href="/wiki/Wikipedia:File_Upload_Wizard" title="Upload files [u]" accesskey="u"><span>Upload file</span></a></li><li id="t-specialpages" class="mw-list-item"><a href="/wiki/Special:SpecialPages" title="A list of all special pages [q]" accesskey="q"><span>Special pages</span></a></li><li id="t-permalink" class="mw-list-item"><a href="/w/index.php?title=Text_mining&amp;oldid=1251100761" title="Permanent link to this 
revision of this page"><span>Permanent link</span></a></li><li id="t-info" class="mw-list-item"><a href="/w/index.php?title=Text_mining&amp;action=info" title="More information about this page"><span>Page information</span></a></li><li id="t-cite" class="mw-list-item"><a href="/w/index.php?title=Special:CiteThisPage&amp;page=Text_mining&amp;id=1251100761&amp;wpFormIdentifier=titleform" title="Information on how to cite this page"><span>Cite this page</span></a></li><li id="t-urlshortener" class="mw-list-item"><a href="/w/index.php?title=Special:UrlShortener&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FText_mining"><span>Get shortened URL</span></a></li><li id="t-urlshortener-qrcode" class="mw-list-item"><a href="/w/index.php?title=Special:QrCode&amp;url=https%3A%2F%2Fen.wikipedia.org%2Fwiki%2FText_mining"><span>Download QR code</span></a></li> </ul> </div> </div> <div id="p-coll-print_export" class="vector-menu mw-portlet mw-portlet-coll-print_export" > <div class="vector-menu-heading"> Print/export </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li id="coll-download-as-rl" class="mw-list-item"><a href="/w/index.php?title=Special:DownloadAsPdf&amp;page=Text_mining&amp;action=show-download-screen" title="Download this page as a PDF file"><span>Download as PDF</span></a></li><li id="t-print" class="mw-list-item"><a href="/w/index.php?title=Text_mining&amp;printable=yes" title="Printable version of this page [p]" accesskey="p"><span>Printable version</span></a></li> </ul> </div> </div> <div id="p-wikibase-otherprojects" class="vector-menu mw-portlet mw-portlet-wikibase-otherprojects" > <div class="vector-menu-heading"> In other projects </div> <div class="vector-menu-content"> <ul class="vector-menu-content-list"> <li class="wb-otherproject-link wb-otherproject-commons mw-list-item"><a href="https://commons.wikimedia.org/wiki/Category:Text_mining" hreflang="en"><span>Wikimedia Commons</span></a></li><li id="t-wikibase" 
class="wb-otherproject-link wb-otherproject-wikibase-dataitem mw-list-item"><a href="https://www.wikidata.org/wiki/Special:EntityPage/Q676880" title="Structured data on this page hosted by Wikidata [g]" accesskey="g"><span>Wikidata item</span></a></li> </ul> </div> </div> </div> </div> </div> </div> </nav> </div> </div> </div> <div class="vector-column-end"> <div class="vector-sticky-pinned-container"> <nav class="vector-page-tools-landmark" aria-label="Page tools"> <div id="vector-page-tools-pinned-container" class="vector-pinned-container"> </div> </nav> <nav class="vector-appearance-landmark" aria-label="Appearance"> <div id="vector-appearance-pinned-container" class="vector-pinned-container"> <div id="vector-appearance" class="vector-appearance vector-pinnable-element"> <div class="vector-pinnable-header vector-appearance-pinnable-header vector-pinnable-header-pinned" data-feature-name="appearance-pinned" data-pinnable-element-id="vector-appearance" data-pinned-container-id="vector-appearance-pinned-container" data-unpinned-container-id="vector-appearance-unpinned-container" > <div class="vector-pinnable-header-label">Appearance</div> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-pin-button" data-event-name="pinnable-header.vector-appearance.pin">move to sidebar</button> <button class="vector-pinnable-header-toggle-button vector-pinnable-header-unpin-button" data-event-name="pinnable-header.vector-appearance.unpin">hide</button> </div> </div> </div> </nav> </div> </div> <div id="bodyContent" class="vector-body" aria-labelledby="firstHeading" data-mw-ve-target-container> <div class="vector-body-before-content"> <div class="mw-indicators"> </div> <div id="siteSub" class="noprint">From Wikipedia, the free encyclopedia</div> </div> <div id="contentSub"><div id="mw-content-subtitle"></div></div> <div id="mw-content-text" class="mw-body-content"><div class="mw-content-ltr mw-parser-output" lang="en" dir="ltr"><div class="shortdescription 
nomobile noexcerpt noprint searchaux" style="display:none">Process of analysing text to extract information from it</div> <p><b>Text mining</b>, <b>text data mining</b> (<b>TDM</b>) or <b>text analytics</b> is the process of deriving high-quality <a href="/wiki/Information" title="Information">information</a> from <a href="/wiki/Plain_text" title="Plain text">text</a>. It involves "the discovery by computer of new, previously unknown information, by automatically extracting information from different written resources."<sup id="cite_ref-1" class="reference"><a href="#cite_note-1"><span class="cite-bracket">&#91;</span>1<span class="cite-bracket">&#93;</span></a></sup> Written resources may include <a href="/wiki/Website" title="Website">websites</a>, <a href="/wiki/Book" title="Book">books</a>, <a href="/wiki/Email" title="Email">emails</a>, <a href="/wiki/Review" title="Review">reviews</a>, and articles. High-quality information is typically obtained by devising patterns and trends by means such as <a href="/wiki/Pattern_recognition" title="Pattern recognition">statistical pattern learning</a>. According to Hotho et al. 
(2005), there are three perspectives of text mining: <a href="/wiki/Information_extraction" title="Information extraction">information extraction</a>, <a href="/wiki/Data_mining" title="Data mining">data mining</a>, and <a href="/wiki/Knowledge_discovery_in_databases" class="mw-redirect" title="Knowledge discovery in databases">knowledge discovery in databases</a> (KDD).<sup id="cite_ref-2" class="reference"><a href="#cite_note-2"><span class="cite-bracket">&#91;</span>2<span class="cite-bracket">&#93;</span></a></sup> Text mining usually involves the process of structuring the input text (usually <a href="/wiki/Parsing" title="Parsing">parsing</a>, along with the addition of some derived linguistic features and the removal of others, and subsequent insertion into a <a href="/wiki/Database" title="Database">database</a>), deriving patterns within the <a href="/wiki/Structured_data" class="mw-redirect" title="Structured data">structured data</a>, and finally evaluation and interpretation of the output. 'High quality' in text mining usually refers to some combination of <a href="/wiki/Relevance_(information_retrieval)" title="Relevance (information retrieval)">relevance</a>, <a href="/wiki/Novelty_(patent)" title="Novelty (patent)">novelty</a>, and interest. 
Typical text mining tasks include <a href="/wiki/Text_categorization" class="mw-redirect" title="Text categorization">text categorization</a>, <a href="/wiki/Text_clustering" class="mw-redirect" title="Text clustering">text clustering</a>, concept/entity extraction, production of granular taxonomies, <a href="/wiki/Sentiment_analysis" title="Sentiment analysis">sentiment analysis</a>, <a href="/wiki/Document_summarization" class="mw-redirect" title="Document summarization">document summarization</a>, and <a href="/wiki/Entity%E2%80%93relationship_model" title="Entity–relationship model">entity relation modeling</a> (<i>i.e.</i>, learning relations between <a href="/wiki/Named_entity_recognition" class="mw-redirect" title="Named entity recognition">named entities</a>). </p><p>Text analysis involves <a href="/wiki/Information_retrieval" title="Information retrieval">information retrieval</a>, <a href="/wiki/Lexical_analysis" title="Lexical analysis">lexical analysis</a> to study word frequency distributions, <a href="/wiki/Pattern_recognition" title="Pattern recognition">pattern recognition</a>, <a href="/wiki/Tag_(metadata)" title="Tag (metadata)">tagging</a>/<a href="/wiki/Annotation" title="Annotation">annotation</a>, <a href="/wiki/Information_extraction" title="Information extraction">information extraction</a>, <a href="/wiki/Data_mining" title="Data mining">data mining</a> techniques including link and association analysis, <a href="/wiki/Information_visualization" class="mw-redirect" title="Information visualization">visualization</a>, and <a href="/wiki/Predictive_analytics" title="Predictive analytics">predictive analytics</a>. The overarching goal is, essentially, to turn text into data for analysis, via the application of <a href="/wiki/Natural_language_processing" title="Natural language processing">natural language processing</a> (NLP), different types of <a href="/wiki/Algorithm" title="Algorithm">algorithms</a> and analytical methods. 
An important phase of this process is the interpretation of the gathered information. </p><p>A typical application is to scan a set of documents written in a <a href="/wiki/Natural_language" title="Natural language">natural language</a> and either model the <a href="/wiki/Document" title="Document">document</a> set for <a href="/wiki/Predictive_classification" class="mw-redirect" title="Predictive classification">predictive classification</a> purposes or populate a database or search index with the information extracted. The <a href="/wiki/Document" title="Document">document</a> is the basic element when starting with text mining. Here, we define a document as a unit of textual data, which normally exists in many types of collections.<sup id="cite_ref-3" class="reference"><a href="#cite_note-3"><span class="cite-bracket">&#91;</span>3<span class="cite-bracket">&#93;</span></a></sup> </p> <meta property="mw:PageProp/toc" /> <div class="mw-heading mw-heading2"><h2 id="Text_analytics">Text analytics</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=1" title="Edit section: Text analytics"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <style data-mw-deduplicate="TemplateStyles:r1236090951">.mw-parser-output .hatnote{font-style:italic}.mw-parser-output div.hatnote{padding-left:1.6em;margin-bottom:0.5em}.mw-parser-output .hatnote i{font-style:normal}.mw-parser-output .hatnote+link+.hatnote{margin-top:-0.5em}@media print{body.ns-0 .mw-parser-output .hatnote{display:none!important}}</style><div role="note" class="hatnote navigation-not-searchable">See also: <a href="/wiki/List_of_text_mining_methods" title="List of text mining methods">List of text mining methods</a></div> <p><b>Text analytics</b> describes a set of <a href="/wiki/Linguistics" title="Linguistics">linguistic</a>, <a href="/wiki/Statistical" class="mw-redirect" 
title="Statistical">statistical</a>, and <a href="/wiki/Machine_learning" title="Machine learning">machine learning</a> techniques that model and structure the information content of textual sources for <a href="/wiki/Business_intelligence" title="Business intelligence">business intelligence</a>, <a href="/wiki/Exploratory_data_analysis" title="Exploratory data analysis">exploratory data analysis</a>, <a href="/wiki/Research" title="Research">research</a>, or investigation.<sup id="cite_ref-4" class="reference"><a href="#cite_note-4"><span class="cite-bracket">&#91;</span>4<span class="cite-bracket">&#93;</span></a></sup> The term is roughly synonymous with text mining; indeed, <a href="/w/index.php?title=Ronen_Feldman&amp;action=edit&amp;redlink=1" class="new" title="Ronen Feldman (page does not exist)">Ronen Feldman</a> modified a 2000 description of "text mining"<sup id="cite_ref-5" class="reference"><a href="#cite_note-5"><span class="cite-bracket">&#91;</span>5<span class="cite-bracket">&#93;</span></a></sup> in 2004 to describe "text analytics".<sup id="cite_ref-6" class="reference"><a href="#cite_note-6"><span class="cite-bracket">&#91;</span>6<span class="cite-bracket">&#93;</span></a></sup> The latter term is now used more frequently in business settings while "text mining" is used in some of the earliest application areas, dating to the 1980s,<sup id="cite_ref-7" class="reference"><a href="#cite_note-7"><span class="cite-bracket">&#91;</span>7<span class="cite-bracket">&#93;</span></a></sup> notably life-sciences research and government intelligence. </p><p>The term text analytics also describes the application of text analytics to respond to business problems, whether independently or in conjunction with query and analysis of fielded, numerical data. 
It is a truism that 80% of business-relevant information originates in <a href="/wiki/Unstructured_data" title="Unstructured data">unstructured</a> form, primarily text.<sup id="cite_ref-breakthroughanalysis1_8-0" class="reference"><a href="#cite_note-breakthroughanalysis1-8"><span class="cite-bracket">&#91;</span>8<span class="cite-bracket">&#93;</span></a></sup> These techniques and processes discover and present knowledge – facts, <a href="/wiki/Business_rule" title="Business rule">business rules</a>, and relationships – that is otherwise locked in textual form, impenetrable to automated processing. </p> <div class="mw-heading mw-heading2"><h2 id="Text_analysis_processes">Text analysis processes</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=2" title="Edit section: Text analysis processes"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Subtasks—components of a larger text-analytics effort—typically include: </p> <ul><li><a href="/wiki/Dimensionality_reduction" title="Dimensionality reduction">Dimensionality reduction</a> is an important technique for pre-processing data. It is used to identify the root word for actual words and reduce the size of the text data.<sup class="noprint Inline-Template Template-Fact" style="white-space:nowrap;">&#91;<i><a href="/wiki/Wikipedia:Citation_needed" title="Wikipedia:Citation needed"><span title="This claim needs references to reliable sources. 
(October 2022)">citation needed</span></a></i>&#93;</sup></li> <li><a href="/wiki/Information_retrieval" title="Information retrieval">Information retrieval</a> or identification of a <a href="/wiki/Text_corpus" title="Text corpus">corpus</a> is a preparatory step: collecting or identifying a set of textual materials, on the Web or held in a <a href="/wiki/File_system" title="File system">file system</a>, <a href="/wiki/Database" title="Database">database</a>, or content <a href="/wiki/Corpus_manager" title="Corpus manager">corpus manager</a>, for analysis.</li> <li>Although some text analytics systems apply exclusively advanced statistical methods, many others apply more extensive <a href="/wiki/Natural_language_processing" title="Natural language processing">natural language processing</a>, such as <a href="/wiki/Part_of_speech_tagging" class="mw-redirect" title="Part of speech tagging">part of speech tagging</a>, syntactic <a href="/wiki/Parsing" title="Parsing">parsing</a>, and other types of linguistic analysis.<sup id="cite_ref-9" class="reference"><a href="#cite_note-9"><span class="cite-bracket">&#91;</span>9<span class="cite-bracket">&#93;</span></a></sup></li> <li><a href="/wiki/Named_entity_recognition" class="mw-redirect" title="Named entity recognition">Named entity recognition</a> is the use of gazetteers or statistical techniques to identify named text features: people, organizations, place names, stock ticker symbols, certain abbreviations, and so on.</li> <li>Disambiguation—the use of <a href="/wiki/Context_(language_use)" class="mw-redirect" title="Context (language use)">contextual</a> clues—may be required to decide whether, for instance, "Ford" refers to a former U.S. 
president, a vehicle manufacturer, a movie star, a river crossing, or some other entity.<sup id="cite_ref-10" class="reference"><a href="#cite_note-10"><span class="cite-bracket">&#91;</span>10<span class="cite-bracket">&#93;</span></a></sup></li> <li>Recognition of pattern-identified entities: Features such as telephone numbers, e-mail addresses, quantities (with units) can be discerned via regular expression or other <a href="/wiki/Pattern_matching" title="Pattern matching">pattern matches</a>.</li> <li><a href="/wiki/Document_clustering" title="Document clustering">Document clustering</a>: identification of sets of similar text documents.<sup id="cite_ref-11" class="reference"><a href="#cite_note-11"><span class="cite-bracket">&#91;</span>11<span class="cite-bracket">&#93;</span></a></sup></li> <li><a href="/wiki/Coreference" title="Coreference">Coreference</a> resolution: identification of <a href="/wiki/Noun_phrase" title="Noun phrase">noun phrases</a> and other terms that refer to the same object.</li> <li>Extraction of relationships, facts and events: identification of associations among entities and other information in texts.</li> <li><a href="/wiki/Sentiment_analysis" title="Sentiment analysis">Sentiment analysis</a>: discerning of subjective material and extracting information about attitudes: sentiment, opinion, mood, and emotion. 
This is done at the entity, concept, or topic level and aims to distinguish opinion holders and objects.<sup id="cite_ref-12" class="reference"><a href="#cite_note-12"><span class="cite-bracket">&#91;</span>12<span class="cite-bracket">&#93;</span></a></sup></li> <li>Quantitative text analysis: a set of techniques stemming from the social sciences where either a human judge or a computer extracts semantic or grammatical relationships between words in order to find out the meaning or stylistic patterns of, usually, a casual personal text for the purpose of <a href="/wiki/Psychological_profiling" class="mw-redirect" title="Psychological profiling">psychological profiling</a> etc.<sup id="cite_ref-13" class="reference"><a href="#cite_note-13"><span class="cite-bracket">&#91;</span>13<span class="cite-bracket">&#93;</span></a></sup></li> <li>Pre-processing usually involves tasks such as tokenization, filtering and stemming.</li></ul> <div class="mw-heading mw-heading2"><h2 id="Applications">Applications</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=3" title="Edit section: Applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Text mining technology is now broadly applied to a wide variety of government, research, and business needs. All these groups may use text mining for records management and searching documents relevant to their daily activities. Legal professionals may use text mining for <a href="/wiki/E-discovery" class="mw-redirect" title="E-discovery">e-discovery</a>, for example. Governments and military groups use text mining for <a href="/wiki/National_security" title="National security">national security</a> and intelligence purposes. 
Scientific researchers incorporate text mining approaches into efforts to organize large sets of text data (i.e., addressing the problem of <a href="/wiki/Unstructured_data" title="Unstructured data">unstructured data</a>), to determine ideas communicated through text (e.g., <a href="/wiki/Sentiment_analysis" title="Sentiment analysis">sentiment analysis</a> in <a href="/wiki/Social_media" title="Social media">social media</a><sup id="cite_ref-14" class="reference"><a href="#cite_note-14"><span class="cite-bracket">&#91;</span>14<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-15" class="reference"><a href="#cite_note-15"><span class="cite-bracket">&#91;</span>15<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-16" class="reference"><a href="#cite_note-16"><span class="cite-bracket">&#91;</span>16<span class="cite-bracket">&#93;</span></a></sup>) and to support <a href="/wiki/Scientific_discovery" class="mw-redirect" title="Scientific discovery">scientific discovery</a> in fields such as the <a href="/wiki/Life_sciences" class="mw-redirect" title="Life sciences">life sciences</a> and <a href="/wiki/Bioinformatics" title="Bioinformatics">bioinformatics</a>. In business, applications are used to support <a href="/wiki/Competitive_intelligence" title="Competitive intelligence">competitive intelligence</a> and automated <a href="/wiki/Ad_serving" class="mw-redirect" title="Ad serving">ad placement</a>, among numerous other activities. 
</p> <div class="mw-heading mw-heading3"><h3 id="Security_applications">Security applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=4" title="Edit section: Security applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Many text mining software packages are marketed for <a href="/wiki/Security_appliance" title="Security appliance">security applications</a>, especially monitoring and analysis of online plain text sources such as <a href="/wiki/Internet_news" class="mw-redirect" title="Internet news">Internet news</a>, <a href="/wiki/Blog" title="Blog">blogs</a>, etc. for <a href="/wiki/National_security" title="National security">national security</a> purposes.<sup id="cite_ref-17" class="reference"><a href="#cite_note-17"><span class="cite-bracket">&#91;</span>17<span class="cite-bracket">&#93;</span></a></sup> It is also involved in the study of text <a href="/wiki/Encryption" title="Encryption">encryption</a>/<a href="/wiki/Decryption" class="mw-redirect" title="Decryption">decryption</a>. </p> <div class="mw-heading mw-heading3"><h3 id="Biomedical_applications">Biomedical applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=5" title="Edit section: Biomedical applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/Biomedical_text_mining" title="Biomedical text mining">Biomedical text mining</a></div> <figure class="mw-default-size" typeof="mw:File/Thumb"><a href="/wiki/File:Text_mining_protocol.png" class="mw-file-description"><img alt="A flowchart of a text mining protocol." 
src="//upload.wikimedia.org/wikipedia/commons/thumb/2/21/Text_mining_protocol.png/220px-Text_mining_protocol.png" decoding="async" width="220" height="565" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/2/21/Text_mining_protocol.png 1.5x" data-file-width="237" data-file-height="609" /></a><figcaption>An example of a text mining protocol used in a study of protein-protein complexes, or <a href="/wiki/Protein_docking" class="mw-redirect" title="Protein docking">protein docking</a>.<sup id="cite_ref-18" class="reference"><a href="#cite_note-18"><span class="cite-bracket">&#91;</span>18<span class="cite-bracket">&#93;</span></a></sup></figcaption></figure> <p>A range of text mining applications in the biomedical literature has been described,<sup id="cite_ref-19" class="reference"><a href="#cite_note-19"><span class="cite-bracket">&#91;</span>19<span class="cite-bracket">&#93;</span></a></sup> including computational approaches to assist with studies in <a href="/wiki/Protein_docking" class="mw-redirect" title="Protein docking">protein docking</a>,<sup id="cite_ref-20" class="reference"><a href="#cite_note-20"><span class="cite-bracket">&#91;</span>20<span class="cite-bracket">&#93;</span></a></sup> <a href="/wiki/Protein_interactions" class="mw-redirect" title="Protein interactions">protein interactions</a>,<sup id="cite_ref-21" class="reference"><a href="#cite_note-21"><span class="cite-bracket">&#91;</span>21<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-22" class="reference"><a href="#cite_note-22"><span class="cite-bracket">&#91;</span>22<span class="cite-bracket">&#93;</span></a></sup> and protein-disease associations.<sup id="cite_ref-23" class="reference"><a href="#cite_note-23"><span class="cite-bracket">&#91;</span>23<span class="cite-bracket">&#93;</span></a></sup> In addition, with large patient textual datasets in the clinical field, datasets of demographic information in population studies and adverse event 
reports, text mining can facilitate clinical studies and precision medicine. Text mining algorithms can facilitate the stratification and indexing of specific clinical events in large patient textual datasets of symptoms, side effects, and comorbidities from electronic health records, event reports, and reports from specific diagnostic tests.<sup id="cite_ref-24" class="reference"><a href="#cite_note-24"><span class="cite-bracket">&#91;</span>24<span class="cite-bracket">&#93;</span></a></sup> One online text mining application in the biomedical literature is <a href="/wiki/PubGene" title="PubGene">PubGene</a>, a publicly accessible <a href="/wiki/Search_engine" title="Search engine">search engine</a> that combines biomedical text mining with network visualization.<sup id="cite_ref-25" class="reference"><a href="#cite_note-25"><span class="cite-bracket">&#91;</span>25<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-26" class="reference"><a href="#cite_note-26"><span class="cite-bracket">&#91;</span>26<span class="cite-bracket">&#93;</span></a></sup> <a href="/wiki/GoPubMed" title="GoPubMed">GoPubMed</a> is a knowledge-based search engine for biomedical texts. 
Text mining techniques also enable us to extract unknown knowledge from unstructured documents in the clinical domain.<sup id="cite_ref-27" class="reference"><a href="#cite_note-27"><span class="cite-bracket">&#91;</span>27<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading3"><h3 id="Software_applications">Software applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=6" title="Edit section: Software applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Text mining methods and software are also being researched and developed by major firms, including <a href="/wiki/IBM" title="IBM">IBM</a> and <a href="/wiki/Microsoft" title="Microsoft">Microsoft</a>, to further automate the mining and analysis processes, and by different firms working in the area of search and indexing in general as a way to improve their results. Within the public sector, much effort has been concentrated on creating software for tracking and monitoring <a href="/wiki/Information_Awareness_Office" title="Information Awareness Office">terrorist activities</a>.<sup id="cite_ref-28" class="reference"><a href="#cite_note-28"><span class="cite-bracket">&#91;</span>28<span class="cite-bracket">&#93;</span></a></sup> For study purposes, <a href="/wiki/Weka_(machine_learning)" class="mw-redirect" title="Weka (machine learning)">Weka software</a> is one of the most popular options in the scientific world, acting as an excellent entry point for beginners. For Python programmers, there is an excellent toolkit called <a href="/wiki/Natural_Language_Toolkit" title="Natural Language Toolkit">NLTK</a> for more general purposes. For more advanced programmers, there's also the <a href="/wiki/Gensim" title="Gensim">Gensim</a> library, which focuses on word embedding-based text representations. 
</p> <div class="mw-heading mw-heading3"><h3 id="Online_media_applications">Online media applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=7" title="Edit section: Online media applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Text mining is being used by large media companies, such as the <a href="/wiki/Tribune_Company" class="mw-redirect" title="Tribune Company">Tribune Company</a>, to clarify information and to provide readers with greater search experiences, which in turn increases site "stickiness" and revenue. Additionally, on the back end, editors are benefiting by being able to share, associate and package news across properties, significantly increasing opportunities to monetize content. </p> <div class="mw-heading mw-heading3"><h3 id="Business_and_marketing_applications">Business and marketing applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=8" title="Edit section: Business and marketing applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Text analytics is being used in business, particularly in marketing, such as in <a href="/wiki/Customer_relationship_management" title="Customer relationship management">customer relationship management</a>.<sup id="cite_ref-Text_Analytics:_The_Why_Behind_the_Score_29-0" class="reference"><a href="#cite_note-Text_Analytics:_The_Why_Behind_the_Score-29"><span class="cite-bracket">&#91;</span>29<span class="cite-bracket">&#93;</span></a></sup> Coussement and Van den Poel (2008)<sup id="cite_ref-10.1016/j.im.2008.01.005_30-0" class="reference"><a href="#cite_note-10.1016/j.im.2008.01.005-30"><span class="cite-bracket">&#91;</span>30<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-31" 
class="reference"><a href="#cite_note-31"><span class="cite-bracket">&#91;</span>31<span class="cite-bracket">&#93;</span></a></sup> apply it to improve <a href="/wiki/Predictive_analytics" title="Predictive analytics">predictive analytics</a> models for customer churn (<a href="/wiki/Customer_attrition" title="Customer attrition">customer attrition</a>).<sup id="cite_ref-10.1016/j.im.2008.01.005_30-1" class="reference"><a href="#cite_note-10.1016/j.im.2008.01.005-30"><span class="cite-bracket">&#91;</span>30<span class="cite-bracket">&#93;</span></a></sup> Text mining is also being applied in stock returns prediction.<sup id="cite_ref-Galvez2017_32-0" class="reference"><a href="#cite_note-Galvez2017-32"><span class="cite-bracket">&#91;</span>32<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading3"><h3 id="Sentiment_analysis">Sentiment analysis</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=9" title="Edit section: Sentiment analysis"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p><a href="/wiki/Sentiment_analysis" title="Sentiment analysis">Sentiment analysis</a> may involve analysis of products such as movies, books, or hotel reviews for estimating how favorable a review is for the product.<sup id="cite_ref-33" class="reference"><a href="#cite_note-33"><span class="cite-bracket">&#91;</span>33<span class="cite-bracket">&#93;</span></a></sup> Such an analysis may need a labeled data set or labeling of the <a href="/wiki/Affect_(psychology)" title="Affect (psychology)">affectivity</a> of words. 
Resources for affectivity of words and concepts have been made for <a href="/wiki/WordNet" title="WordNet">WordNet</a><sup id="cite_ref-34" class="reference"><a href="#cite_note-34"><span class="cite-bracket">&#91;</span>34<span class="cite-bracket">&#93;</span></a></sup> and <a href="/wiki/ConceptNet" class="mw-redirect" title="ConceptNet">ConceptNet</a>,<sup id="cite_ref-camnet_35-0" class="reference"><a href="#cite_note-camnet-35"><span class="cite-bracket">&#91;</span>35<span class="cite-bracket">&#93;</span></a></sup> respectively. </p><p>Text has been used to detect emotions in the related area of affective computing.<sup id="cite_ref-36" class="reference"><a href="#cite_note-36"><span class="cite-bracket">&#91;</span>36<span class="cite-bracket">&#93;</span></a></sup> Text-based approaches to affective computing have been used on multiple corpora such as student evaluations, children's stories, and news stories. </p> <div class="mw-heading mw-heading3"><h3 id="Scientific_literature_mining_and_academic_applications">Scientific literature mining and academic applications</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=10" title="Edit section: Scientific literature mining and academic applications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The issue of text mining is of importance to publishers who hold large <a href="/wiki/Database" title="Database">databases</a> of information needing <a href="/wiki/Index_(database)" class="mw-redirect" title="Index (database)">indexing</a> for retrieval. This is especially true in scientific disciplines, in which highly specific information is often contained within the written text. 
Therefore, initiatives have been taken such as <a href="/wiki/Nature_(journal)" title="Nature (journal)">Nature's</a> proposal for an Open Text Mining Interface (OTMI) and the <a href="/wiki/National_Institutes_of_Health" title="National Institutes of Health">National Institutes of Health</a>'s common Journal Publishing <a href="/wiki/Document_Type_Definition" class="mw-redirect" title="Document Type Definition">Document Type Definition</a> (DTD) that would provide semantic cues to machines to answer specific queries contained within the text without removing publisher barriers to public access. </p><p>Academic institutions have also become involved in the text mining initiative: </p> <ul><li>The <a href="/wiki/National_Centre_for_Text_Mining" title="National Centre for Text Mining">National Centre for Text Mining</a> (NaCTeM) is the first publicly funded text mining centre in the world. NaCTeM is operated by the <a href="/wiki/University_of_Manchester" title="University of Manchester">University of Manchester</a><sup id="cite_ref-37" class="reference"><a href="#cite_note-37"><span class="cite-bracket">&#91;</span>37<span class="cite-bracket">&#93;</span></a></sup> in close collaboration with the Tsujii Lab,<sup id="cite_ref-38" class="reference"><a href="#cite_note-38"><span class="cite-bracket">&#91;</span>38<span class="cite-bracket">&#93;</span></a></sup> <a href="/wiki/University_of_Tokyo" title="University of Tokyo">University of Tokyo</a>.<sup id="cite_ref-39" class="reference"><a href="#cite_note-39"><span class="cite-bracket">&#91;</span>39<span class="cite-bracket">&#93;</span></a></sup> NaCTeM provides customised tools and research facilities and offers advice to the academic community. 
They are funded by the <a href="/wiki/Joint_Information_Systems_Committee" class="mw-redirect" title="Joint Information Systems Committee">Joint Information Systems Committee</a> (JISC) and two of the UK <a href="/wiki/Research_council_(United_Kingdom)" class="mw-redirect" title="Research council (United Kingdom)">research councils</a> (<a href="/wiki/EPSRC" class="mw-redirect" title="EPSRC">EPSRC</a> &amp; <a href="/wiki/BBSRC" class="mw-redirect" title="BBSRC">BBSRC</a>). With an initial focus on text mining in the <a href="/wiki/Biology" title="Biology">biological</a> and <a href="/wiki/Biomedical" class="mw-redirect" title="Biomedical">biomedical</a> sciences, research has since expanded into the areas of <a href="/wiki/Social_sciences" class="mw-redirect" title="Social sciences">social sciences</a>.</li> <li>In the United States, the <a href="/wiki/UC_Berkeley_School_of_Information" title="UC Berkeley School of Information">School of Information</a> at <a href="/wiki/University_of_California,_Berkeley" title="University of California, Berkeley">University of California, Berkeley</a> is developing a program called BioText to assist <a href="/wiki/Biology" title="Biology">biology</a> researchers in text mining and analysis.</li> <li>The <a href="/wiki/Text_Analysis_Portal_for_Research" title="Text Analysis Portal for Research">Text Analysis Portal for Research</a> (TAPoR), currently housed at the <a href="/wiki/University_of_Alberta" title="University of Alberta">University of Alberta</a>, is a scholarly project to catalogue text analysis applications and create a gateway for researchers new to the practice.</li></ul> <div class="mw-heading mw-heading4"><h4 id="Methods_for_scientific_literature_mining">Methods for scientific literature mining</h4><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=11" title="Edit section: Methods for scientific literature 
mining"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Computational methods have been developed to assist with information retrieval from scientific literature. Published approaches include methods for searching,<sup id="cite_ref-40" class="reference"><a href="#cite_note-40"><span class="cite-bracket">&#91;</span>40<span class="cite-bracket">&#93;</span></a></sup> determining novelty,<sup id="cite_ref-41" class="reference"><a href="#cite_note-41"><span class="cite-bracket">&#91;</span>41<span class="cite-bracket">&#93;</span></a></sup> and clarifying <a href="/wiki/Homonym" title="Homonym">homonyms</a><sup id="cite_ref-42" class="reference"><a href="#cite_note-42"><span class="cite-bracket">&#91;</span>42<span class="cite-bracket">&#93;</span></a></sup> among technical reports. </p> <div class="mw-heading mw-heading3"><h3 id="Digital_humanities_and_computational_sociology">Digital humanities and computational sociology</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=12" title="Edit section: Digital humanities and computational sociology"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>The automatic analysis of vast textual corpora has created the possibility for scholars to analyze millions of documents in multiple languages with very limited manual intervention. Key enabling technologies have been parsing, <a href="/wiki/Machine_translation" title="Machine translation">machine translation</a>, topic <a href="/wiki/Categorization" class="mw-redirect" title="Categorization">categorization</a>, and machine learning. 
</p> <figure class="mw-default-size mw-halign-right" typeof="mw:File/Thumb"><a href="/wiki/File:Tripletsnew2012.png" class="mw-file-description"><img src="//upload.wikimedia.org/wikipedia/commons/thumb/4/43/Tripletsnew2012.png/220px-Tripletsnew2012.png" decoding="async" width="220" height="235" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/commons/thumb/4/43/Tripletsnew2012.png/330px-Tripletsnew2012.png 1.5x, //upload.wikimedia.org/wikipedia/commons/thumb/4/43/Tripletsnew2012.png/440px-Tripletsnew2012.png 2x" data-file-width="538" data-file-height="574" /></a><figcaption>Narrative network of US Elections 2012<sup id="cite_ref-ReferenceA_43-0" class="reference"><a href="#cite_note-ReferenceA-43"><span class="cite-bracket">&#91;</span>43<span class="cite-bracket">&#93;</span></a></sup></figcaption></figure> <p>The automatic parsing of textual corpora has enabled the extraction of actors and their relational networks on a vast scale, turning textual data into network data. 
The resulting networks, which can contain thousands of nodes, are then analyzed by using tools from network theory to identify the key actors, the key communities or parties, and general properties such as robustness or structural stability of the overall network, or centrality of certain nodes.<sup id="cite_ref-44" class="reference"><a href="#cite_note-44"><span class="cite-bracket">&#91;</span>44<span class="cite-bracket">&#93;</span></a></sup> This automates the approach introduced by quantitative narrative analysis,<sup id="cite_ref-45" class="reference"><a href="#cite_note-45"><span class="cite-bracket">&#91;</span>45<span class="cite-bracket">&#93;</span></a></sup> whereby <a href="/wiki/Subject-verb-object" class="mw-redirect" title="Subject-verb-object">subject-verb-object</a> triplets are identified with pairs of actors linked by an action, or pairs formed by actor-object.<sup id="cite_ref-ReferenceA_43-1" class="reference"><a href="#cite_note-ReferenceA-43"><span class="cite-bracket">&#91;</span>43<span class="cite-bracket">&#93;</span></a></sup> </p><p><a href="/wiki/Content_analysis" title="Content analysis">Content analysis</a> has been a traditional part of social sciences and media studies for a long time. The automation of content analysis has allowed a "<a href="/wiki/Big_data" title="Big data">big data</a>" revolution to take place in that field, with studies in social media and newspaper content that include millions of news items. 
<a href="/wiki/Gender_bias" class="mw-redirect" title="Gender bias">Gender bias</a>, <a href="/wiki/Readability" title="Readability">readability</a>, content similarity, reader preferences, and even mood have been analyzed based on text mining methods over millions of documents.<sup id="cite_ref-46" class="reference"><a href="#cite_note-46"><span class="cite-bracket">&#91;</span>46<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-47" class="reference"><a href="#cite_note-47"><span class="cite-bracket">&#91;</span>47<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-48" class="reference"><a href="#cite_note-48"><span class="cite-bracket">&#91;</span>48<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-49" class="reference"><a href="#cite_note-49"><span class="cite-bracket">&#91;</span>49<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-50" class="reference"><a href="#cite_note-50"><span class="cite-bracket">&#91;</span>50<span class="cite-bracket">&#93;</span></a></sup> The analysis of readability, gender bias and topic bias was demonstrated in Flaounas et al.<sup id="cite_ref-51" class="reference"><a href="#cite_note-51"><span class="cite-bracket">&#91;</span>51<span class="cite-bracket">&#93;</span></a></sup> showing how different topics have different gender biases and levels of readability; the possibility to detect mood patterns in a vast population by analyzing Twitter content was demonstrated as well.<sup id="cite_ref-52" class="reference"><a href="#cite_note-52"><span class="cite-bracket">&#91;</span>52<span class="cite-bracket">&#93;</span></a></sup><sup id="cite_ref-53" class="reference"><a href="#cite_note-53"><span class="cite-bracket">&#91;</span>53<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading2"><h2 id="Software">Software</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a 
href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=13" title="Edit section: Software"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236090951"><div role="note" class="hatnote navigation-not-searchable">Main article: <a href="/wiki/List_of_text_mining_software" title="List of text mining software">List of text mining software</a></div> <p>Text mining computer programs are available from many <a href="/wiki/Commercial_software" title="Commercial software">commercial</a> and <a href="/wiki/Open_source" title="Open source">open source</a> companies and sources. </p> <div class="mw-heading mw-heading2"><h2 id="Intellectual_property_law">Intellectual property law</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=14" title="Edit section: Intellectual property law"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <div class="mw-heading mw-heading3"><h3 id="Situation_in_Europe">Situation in Europe</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=15" title="Edit section: Situation in Europe"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <figure class="mw-default-size" typeof="mw:File/Thumb"><span><video id="mwe_player_0" poster="//upload.wikimedia.org/wikipedia/commons/thumb/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/220px--FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.jpg" controls="" preload="none" data-mw-tmh="" class="mw-file-element" width="220" height="124" data-durationhint="232" data-mwtitle="FixCopyright-_Copyright_&amp;_Research_-_Text_&amp;_Data_Mining_(TDM)_Explained.webm" data-mwprovider="wikimediacommons" 
resource="/wiki/File:FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_(TDM)_Explained.webm"><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.480p.vp9.webm" type="video/webm; codecs=&quot;vp9, opus&quot;" data-transcodekey="480p.vp9.webm" data-width="854" data-height="480" /><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.720p.vp9.webm" type="video/webm; codecs=&quot;vp9, opus&quot;" data-transcodekey="720p.vp9.webm" data-width="1280" data-height="720" /><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.1080p.vp9.webm" type="video/webm; codecs=&quot;vp9, opus&quot;" data-transcodekey="1080p.vp9.webm" data-width="1920" data-height="1080" /><source src="//upload.wikimedia.org/wikipedia/commons/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm" type="video/webm; codecs=&quot;vp8, vorbis&quot;" data-width="1920" data-height="1080" /><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.144p.mjpeg.mov" type="video/quicktime" data-transcodekey="144p.mjpeg.mov" data-width="256" data-height="144" /><source 
src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.240p.vp9.webm" type="video/webm; codecs=&quot;vp9, opus&quot;" data-transcodekey="240p.vp9.webm" data-width="426" data-height="240" /><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.360p.vp9.webm" type="video/webm; codecs=&quot;vp9, opus&quot;" data-transcodekey="360p.vp9.webm" data-width="640" data-height="360" /><source src="//upload.wikimedia.org/wikipedia/commons/transcoded/1/15/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm/FixCopyright-_Copyright_%26_Research_-_Text_%26_Data_Mining_%28TDM%29_Explained.webm.360p.webm" type="video/webm; codecs=&quot;vp8, vorbis&quot;" data-transcodekey="360p.webm" data-width="640" data-height="360" /></video></span><figcaption>Video by Fix Copyright campaign explaining TDM and its copyright issues in the EU, 2016 [3:51]</figcaption></figure> <p>Under <a href="/wiki/Copyright_law_of_the_European_Union" title="Copyright law of the European Union">European copyright</a> and <a href="/wiki/Database_Directive" title="Database Directive">database laws</a>, the mining of in-copyright works (such as by <a href="/wiki/Web_mining" class="mw-redirect" title="Web mining">web mining</a>) without the permission of the copyright owner is illegal. 
In the UK in 2014, on the recommendation of the <a href="/w/index.php?title=Hargreaves_review&amp;action=edit&amp;redlink=1" class="new" title="Hargreaves review (page does not exist)">Hargreaves review</a>, the government amended copyright law<sup id="cite_ref-54" class="reference"><a href="#cite_note-54"><span class="cite-bracket">&#91;</span>54<span class="cite-bracket">&#93;</span></a></sup> to allow text mining as a <a href="/wiki/Limitations_and_exceptions_to_copyright" title="Limitations and exceptions to copyright">limitation and exception</a>. It was the second country in the world to do so, following <a href="/wiki/Copyright_law_of_Japan" title="Copyright law of Japan">Japan</a>, which introduced a mining-specific exception in 2009. However, owing to the restriction of the <a href="/wiki/Information_Society_Directive" class="mw-redirect" title="Information Society Directive">Information Society Directive</a> (2001), the UK exception only allows content mining for non-commercial purposes. UK copyright law does not allow this provision to be overridden by contractual terms and conditions. 
</p><p>The <a href="/wiki/European_Commission" title="European Commission">European Commission</a> facilitated stakeholder discussion on text and <a href="/wiki/Data_mining" title="Data mining">data mining</a> in 2013, under the title of Licenses for Europe.<sup id="cite_ref-55" class="reference"><a href="#cite_note-55"><span class="cite-bracket">&#91;</span>55<span class="cite-bracket">&#93;</span></a></sup> The fact that the proposed solution to this legal issue focused on licenses, rather than on limitations and exceptions to copyright law, led representatives of universities, researchers, libraries, civil society groups and <a href="/wiki/Open_access" title="Open access">open access</a> publishers to leave the stakeholder dialogue in May 2013.<sup id="cite_ref-56" class="reference"><a href="#cite_note-56"><span class="cite-bracket">&#91;</span>56<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading3"><h3 id="Situation_in_the_United_States">Situation in the United States</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=16" title="Edit section: Situation in the United States"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p><a href="/wiki/Copyright_law_of_the_United_States" title="Copyright law of the United States">US copyright law</a>, and in particular its <a href="/wiki/Fair_use" title="Fair use">fair use</a> provisions, means that text mining in the United States, as well as in other fair use countries such as Israel, Taiwan and South Korea, is viewed as being legal. As text mining is transformative, meaning that it does not supplant the original work, it is viewed as being lawful under fair use. 
For example, as part of the <a href="/wiki/Google_Book_Search_Settlement_Agreement" class="mw-redirect" title="Google Book Search Settlement Agreement">Google Book settlement</a>, the presiding judge on the case ruled that Google's digitization project of in-copyright books was lawful, in part because of the transformative uses that the digitization project displayed—one such use being text and data mining.<sup id="cite_ref-57" class="reference"><a href="#cite_note-57"><span class="cite-bracket">&#91;</span>57<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading3"><h3 id="Situation_in_Australia">Situation in Australia</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=17" title="Edit section: Situation in Australia"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>There is no exception in the <a href="/wiki/Copyright_law_of_Australia" title="Copyright law of Australia">copyright law of Australia</a> for text or data mining within the <i><a href="/wiki/Copyright_Act_1968" class="mw-redirect" title="Copyright Act 1968">Copyright Act 1968</a></i>. 
The <a href="/wiki/Australian_Law_Reform_Commission" title="Australian Law Reform Commission">Australian Law Reform Commission</a> has noted that it is unlikely that the "research and study" <a href="/wiki/Fair_dealing" title="Fair dealing">fair dealing</a> exception would extend to cover text or data mining either, given that it would go beyond the "reasonable portion" requirement.<sup id="cite_ref-58" class="reference"><a href="#cite_note-58"><span class="cite-bracket">&#91;</span>58<span class="cite-bracket">&#93;</span></a></sup> </p> <div class="mw-heading mw-heading2"><h2 id="Implications">Implications</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=18" title="Edit section: Implications"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <p>Until recently, websites most often used text-based searches, which only found documents containing specific user-defined words or phrases. Now, through the use of a <a href="/wiki/Semantic_web" class="mw-redirect" title="Semantic web">semantic web</a>, text mining can find content based on meaning and context (rather than just by a specific word). Additionally, text mining software can be used to build large dossiers of information about specific people and events. For example, large datasets based on data extracted from news reports can be built to facilitate social network analysis or <a href="/wiki/Counter-intelligence" class="mw-redirect" title="Counter-intelligence">counter-intelligence</a>. In effect, the text mining software may act in a capacity similar to an <a href="/wiki/Intelligence_analyst" class="mw-redirect" title="Intelligence analyst">intelligence analyst</a> or research librarian, albeit with a more limited scope of analysis. 
Text mining is also used in some email <a href="/wiki/Spam_filter" class="mw-redirect" title="Spam filter">spam filters</a> as a way of determining the characteristics of messages that are likely to be advertisements or other unwanted material. Text mining plays an important role in determining financial <a href="/wiki/Market_sentiment" title="Market sentiment">market sentiment</a>. </p> <div class="mw-heading mw-heading2"><h2 id="See_also">See also</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=19" title="Edit section: See also"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <style data-mw-deduplicate="TemplateStyles:r1184024115">.mw-parser-output .div-col{margin-top:0.3em;column-width:30em}.mw-parser-output .div-col-small{font-size:90%}.mw-parser-output .div-col-rules{column-rule:1px solid #aaa}.mw-parser-output .div-col dl,.mw-parser-output .div-col ol,.mw-parser-output .div-col ul{margin-top:0}.mw-parser-output .div-col li,.mw-parser-output .div-col dd{page-break-inside:avoid;break-inside:avoid-column}</style><div class="div-col" style="column-width: 22em;"> <ul><li><a href="/wiki/Concept_mining" title="Concept mining">Concept mining</a></li> <li><a href="/wiki/Document_processing" title="Document processing">Document processing</a></li> <li><a href="/wiki/Full_text_search" class="mw-redirect" title="Full text search">Full text search</a></li> <li><a href="/wiki/List_of_text_mining_software" title="List of text mining software">List of text mining software</a></li> <li><a href="/wiki/Market_sentiment" title="Market sentiment">Market sentiment</a></li> <li><a href="/wiki/Name_resolution_(semantics_and_text_extraction)" title="Name resolution (semantics and text extraction)">Name resolution (semantics and text extraction)</a></li> <li><a href="/wiki/Named_entity_recognition" class="mw-redirect" title="Named entity recognition">Named 
entity recognition</a></li> <li><a href="/wiki/News_analytics" title="News analytics">News analytics</a></li> <li><a href="/wiki/Ontology_learning" title="Ontology learning">Ontology learning</a></li> <li><a href="/wiki/Record_linkage" title="Record linkage">Record linkage</a></li> <li><a href="/wiki/Sequential_pattern_mining" title="Sequential pattern mining">Sequential pattern mining</a> (string and sequence mining)</li> <li><a href="/wiki/W-shingling" title="W-shingling">w-shingling</a></li> <li><a href="/wiki/Web_mining" class="mw-redirect" title="Web mining">Web mining</a>, a task that may involve text mining (e.g. first find appropriate web pages by classifying crawled web pages, then extract the desired information from the text content of these pages considered relevant)</li></ul> </div> <div class="mw-heading mw-heading2"><h2 id="References">References</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=20" title="Edit section: References"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <div class="mw-heading mw-heading3"><h3 id="Citations">Citations</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=21" title="Edit section: Citations"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <style data-mw-deduplicate="TemplateStyles:r1239543626">.mw-parser-output .reflist{margin-bottom:0.5em;list-style-type:decimal}@media screen{.mw-parser-output .reflist{font-size:90%}}.mw-parser-output .reflist .references{font-size:100%;margin-bottom:0;list-style-type:inherit}.mw-parser-output .reflist-columns-2{column-width:30em}.mw-parser-output .reflist-columns-3{column-width:25em}.mw-parser-output .reflist-columns{margin-top:0.3em}.mw-parser-output .reflist-columns ol{margin-top:0}.mw-parser-output .reflist-columns 
li{page-break-inside:avoid;break-inside:avoid-column}.mw-parser-output .reflist-upper-alpha{list-style-type:upper-alpha}.mw-parser-output .reflist-upper-roman{list-style-type:upper-roman}.mw-parser-output .reflist-lower-alpha{list-style-type:lower-alpha}.mw-parser-output .reflist-lower-greek{list-style-type:lower-greek}.mw-parser-output .reflist-lower-roman{list-style-type:lower-roman}</style><div class="reflist"> <div class="mw-references-wrap mw-references-columns"><ol class="references"> <li id="cite_note-1"><span class="mw-cite-backlink"><b><a href="#cite_ref-1">^</a></b></span> <span class="reference-text"><style data-mw-deduplicate="TemplateStyles:r1238218222">.mw-parser-output cite.citation{font-style:inherit;word-wrap:break-word}.mw-parser-output .citation q{quotes:"\"""\"""'""'"}.mw-parser-output .citation:target{background-color:rgba(0,127,255,0.133)}.mw-parser-output .id-lock-free.id-lock-free a{background:url("//upload.wikimedia.org/wikipedia/commons/6/65/Lock-green.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-limited.id-lock-limited a,.mw-parser-output .id-lock-registration.id-lock-registration a{background:url("//upload.wikimedia.org/wikipedia/commons/d/d6/Lock-gray-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .id-lock-subscription.id-lock-subscription a{background:url("//upload.wikimedia.org/wikipedia/commons/a/aa/Lock-red-alt-2.svg")right 0.1em center/9px no-repeat}.mw-parser-output .cs1-ws-icon a{background:url("//upload.wikimedia.org/wikipedia/commons/4/4c/Wikisource-logo.svg")right 0.1em center/12px no-repeat}body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-free a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-limited a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-registration a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .id-lock-subscription a,body:not(.skin-timeless):not(.skin-minerva) .mw-parser-output .cs1-ws-icon 
a{background-size:contain;padding:0 1em 0 0}.mw-parser-output .cs1-code{color:inherit;background:inherit;border:none;padding:inherit}.mw-parser-output .cs1-hidden-error{display:none;color:var(--color-error,#d33)}.mw-parser-output .cs1-visible-error{color:var(--color-error,#d33)}.mw-parser-output .cs1-maint{display:none;color:#085;margin-left:0.3em}.mw-parser-output .cs1-kern-left{padding-left:0.2em}.mw-parser-output .cs1-kern-right{padding-right:0.2em}.mw-parser-output .citation .mw-selflink{font-weight:inherit}@media screen{.mw-parser-output .cs1-format{font-size:95%}html.skin-theme-clientpref-night .mw-parser-output .cs1-maint{color:#18911f}}@media screen and (prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .cs1-maint{color:#18911f}}</style><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://people.ischool.berkeley.edu/~hearst/text-mining.html">"Marti Hearst: What is Text Mining?"</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Marti+Hearst%3A+What+is+Text+Mining%3F&amp;rft_id=http%3A%2F%2Fpeople.ischool.berkeley.edu%2F~hearst%2Ftext-mining.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-2"><span class="mw-cite-backlink"><b><a href="#cite_ref-2">^</a></b></span> <span class="reference-text">Hotho, A., Nürnberger, A. and Paaß, G. (2005). "A brief survey of text mining". In LDV Forum, Vol. 20(1), pp. 19–62</span> </li> <li id="cite_note-3"><span class="mw-cite-backlink"><b><a href="#cite_ref-3">^</a></b></span> <span class="reference-text">Feldman, R. and Sanger, J. (2007). The text mining handbook. Cambridge University Press. 
New York</span> </li> <li id="cite_note-4"><span class="mw-cite-backlink"><b><a href="#cite_ref-4">^</a></b></span> <span class="reference-text"><a rel="nofollow" class="external autonumber" href="http://intelligent-enterprise.informationweek.com/blog/archives/2007/02/defining_text_a.html">[1]</a> <a rel="nofollow" class="external text" href="https://web.archive.org/web/20091129171151/http://intelligent-enterprise.informationweek.com/blog/archives/2007/02/defining_text_a.html">Archived</a> November 29, 2009, at the <a href="/wiki/Wayback_Machine" title="Wayback Machine">Wayback Machine</a></span> </li> <li id="cite_note-5"><span class="mw-cite-backlink"><b><a href="#cite_ref-5">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.cs.cmu.edu/~dunja/CFPWshKDD2000.html">"KDD-2000 Workshop on Text Mining – Call for Papers"</a>. Cs.cmu.edu<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=KDD-2000+Workshop+on+Text+Mining+%E2%80%93+Call+for+Papers&amp;rft.pub=Cs.cmu.edu&amp;rft_id=https%3A%2F%2Fwww.cs.cmu.edu%2F~dunja%2FCFPWshKDD2000.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-6"><span class="mw-cite-backlink"><b><a href="#cite_ref-6">^</a></b></span> <span class="reference-text"><a rel="nofollow" class="external autonumber" href="http://www.ir.iit.edu/cikm2004/tutorials.html#T2">[2]</a> <a rel="nofollow" class="external text" href="https://web.archive.org/web/20120303042253/http://www.ir.iit.edu/cikm2004/tutorials.html#T2">Archived</a> March 3, 2012, at the <a href="/wiki/Wayback_Machine" title="Wayback Machine">Wayback Machine</a></span> </li> <li id="cite_note-7"><span class="mw-cite-backlink"><b><a href="#cite_ref-7">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFHobbsWalkerAmsler1982" class="citation book cs1">Hobbs, Jerry R.; Walker, Donald E.; Amsler, Robert A. (1982). "Natural language access to structured text". <i>Proceedings of the 9th conference on Computational linguistics</i>. Vol.&#160;1. pp.&#160;127–32. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.3115%2F991813.991833">10.3115/991813.991833</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:6433117">6433117</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Natural+language+access+to+structured+text&amp;rft.btitle=Proceedings+of+the+9th+conference+on+Computational+linguistics&amp;rft.pages=127-32&amp;rft.date=1982&amp;rft_id=info%3Adoi%2F10.3115%2F991813.991833&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A6433117%23id-name%3DS2CID&amp;rft.aulast=Hobbs&amp;rft.aufirst=Jerry+R.&amp;rft.au=Walker%2C+Donald+E.&amp;rft.au=Amsler%2C+Robert+A.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-breakthroughanalysis1-8"><span class="mw-cite-backlink"><b><a href="#cite_ref-breakthroughanalysis1_8-0">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://breakthroughanalysis.com/2008/08/01/unstructured-data-and-the-80-percent-rule/">"Unstructured Data and the 80 Percent Rule"</a>. Breakthrough Analysis. August 2008<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Unstructured+Data+and+the+80+Percent+Rule&amp;rft.pub=Breakthrough+Analysis&amp;rft.date=2008-08&amp;rft_id=http%3A%2F%2Fbreakthroughanalysis.com%2F2008%2F08%2F01%2Funstructured-data-and-the-80-percent-rule%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-9"><span class="mw-cite-backlink"><b><a href="#cite_ref-9">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFAntunes2018" class="citation thesis cs1 cs1-prop-foreign-lang-source">Antunes, João (2018-11-14). <a rel="nofollow" class="external text" href="http://www.teses.usp.br/teses/disponiveis/55/55134/tde-03012019-103253/"><i>Exploração de informações contextuais para enriquecimento semântico em representações de textos</i></a> (Mestrado em Ciências de Computação e Matemática Computacional thesis) (in Portuguese). São Carlos: Universidade de São Paulo. 
<a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.11606%2Fd.55.2019.tde-03012019-103253">10.11606/d.55.2019.tde-03012019-103253</a></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Adissertation&amp;rft.title=Explora%C3%A7%C3%A3o+de+informa%C3%A7%C3%B5es+contextuais+para+enriquecimento+sem%C3%A2ntico+em+representa%C3%A7%C3%B5es+de+textos&amp;rft.degree=Mestrado+em+Ci%C3%AAncias+de+Computa%C3%A7%C3%A3o+e+Matem%C3%A1tica+Computacional&amp;rft.inst=Universidade+de+S%C3%A3o+Paulo&amp;rft.date=2018-11-14&amp;rft_id=info%3Adoi%2F10.11606%2Fd.55.2019.tde-03012019-103253&amp;rft.aulast=Antunes&amp;rft.aufirst=Jo%C3%A3o&amp;rft_id=http%3A%2F%2Fwww.teses.usp.br%2Fteses%2Fdisponiveis%2F55%2F55134%2Ftde-03012019-103253%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-10"><span class="mw-cite-backlink"><b><a href="#cite_ref-10">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMoroRaganatoNavigli2014" class="citation journal cs1">Moro, Andrea; Raganato, Alessandro; Navigli, Roberto (December 2014). <a rel="nofollow" class="external text" href="https://doi.org/10.1162%2Ftacl_a_00179">"Entity Linking meets Word Sense Disambiguation: a Unified Approach"</a>. <i>Transactions of the Association for Computational Linguistics</i>. <b>2</b>: 231–244. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1162%2Ftacl_a_00179">10.1162/tacl_a_00179</a></span>. 
<a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/2307-387X">2307-387X</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Transactions+of+the+Association+for+Computational+Linguistics&amp;rft.atitle=Entity+Linking+meets+Word+Sense+Disambiguation%3A+a+Unified+Approach&amp;rft.volume=2&amp;rft.pages=231-244&amp;rft.date=2014-12&amp;rft_id=info%3Adoi%2F10.1162%2Ftacl_a_00179&amp;rft.issn=2307-387X&amp;rft.aulast=Moro&amp;rft.aufirst=Andrea&amp;rft.au=Raganato%2C+Alessandro&amp;rft.au=Navigli%2C+Roberto&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.1162%252Ftacl_a_00179&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-11"><span class="mw-cite-backlink"><b><a href="#cite_ref-11">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFChangTayLim2017" class="citation journal cs1">Chang, Wui Lee; Tay, Kai Meng; Lim, Chee Peng (2017-02-06). "A New Evolving Tree-Based Model with Local Re-learning for Document Clustering and Visualization". <i>Neural Processing Letters</i>. <b>46</b> (2): 379–409. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1007%2Fs11063-017-9597-3">10.1007/s11063-017-9597-3</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/1370-4621">1370-4621</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:9100902">9100902</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Neural+Processing+Letters&amp;rft.atitle=A+New+Evolving+Tree-Based+Model+with+Local+Re-learning+for+Document+Clustering+and+Visualization&amp;rft.volume=46&amp;rft.issue=2&amp;rft.pages=379-409&amp;rft.date=2017-02-06&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A9100902%23id-name%3DS2CID&amp;rft.issn=1370-4621&amp;rft_id=info%3Adoi%2F10.1007%2Fs11063-017-9597-3&amp;rft.aulast=Chang&amp;rft.aufirst=Wui+Lee&amp;rft.au=Tay%2C+Kai+Meng&amp;rft.au=Lim%2C+Chee+Peng&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-12"><span class="mw-cite-backlink"><b><a href="#cite_ref-12">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBenchimolKazinnikSaadon2022" class="citation journal cs1">Benchimol, Jonathan; Kazinnik, Sophia; Saadon, Yossi (2022). <a rel="nofollow" class="external text" href="https://paperswithcode.com/paper/text-mining-methodologies-with-r-an">"Text mining methodologies with R: An application to central bank texts"</a>. <i>Machine Learning with Applications</i>. <b>8</b>: 100286. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.mlwa.2022.100286">10.1016/j.mlwa.2022.100286</a></span>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:243798160">243798160</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Machine+Learning+with+Applications&amp;rft.atitle=Text+mining+methodologies+with+R%3A+An+application+to+central+bank+texts&amp;rft.volume=8&amp;rft.pages=100286&amp;rft.date=2022&amp;rft_id=info%3Adoi%2F10.1016%2Fj.mlwa.2022.100286&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A243798160%23id-name%3DS2CID&amp;rft.aulast=Benchimol&amp;rft.aufirst=Jonathan&amp;rft.au=Kazinnik%2C+Sophia&amp;rft.au=Saadon%2C+Yossi&amp;rft_id=https%3A%2F%2Fpaperswithcode.com%2Fpaper%2Ftext-mining-methodologies-with-r-an&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-13"><span class="mw-cite-backlink"><b><a href="#cite_ref-13">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMehl2006" class="citation book cs1">Mehl, Matthias R. (2006). "Quantitative Text Analysis". <i>Handbook of multimethod measurement in psychology</i>. p.&#160;141. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1037%2F11383-011">10.1037/11383-011</a>. 
<a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-59147-318-3" title="Special:BookSources/978-1-59147-318-3"><bdi>978-1-59147-318-3</bdi></a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Quantitative+Text+Analysis&amp;rft.btitle=Handbook+of+multimethod+measurement+in+psychology&amp;rft.pages=141&amp;rft.date=2006&amp;rft_id=info%3Adoi%2F10.1037%2F11383-011&amp;rft.isbn=978-1-59147-318-3&amp;rft.aulast=Mehl&amp;rft.aufirst=Matthias+R.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-14"><span class="mw-cite-backlink"><b><a href="#cite_ref-14">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPangLee2008" class="citation journal cs1">Pang, Bo; <a href="/wiki/Lillian_Lee_(computer_scientist)" title="Lillian Lee (computer scientist)">Lee, Lillian</a> (2008). "Opinion Mining and Sentiment Analysis". <i>Foundations and Trends in Information Retrieval</i>. <b>2</b> (1–2): 1–135. <a href="/wiki/CiteSeerX_(identifier)" class="mw-redirect" title="CiteSeerX (identifier)">CiteSeerX</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.147.2755">10.1.1.147.2755</a></span>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1561%2F1500000011">10.1561/1500000011</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/1554-0669">1554-0669</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:207178694">207178694</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Foundations+and+Trends+in+Information+Retrieval&amp;rft.atitle=Opinion+Mining+and+Sentiment+Analysis&amp;rft.volume=2&amp;rft.issue=1%E2%80%932&amp;rft.pages=1-135&amp;rft.date=2008&amp;rft_id=https%3A%2F%2Fciteseerx.ist.psu.edu%2Fviewdoc%2Fsummary%3Fdoi%3D10.1.1.147.2755%23id-name%3DCiteSeerX&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A207178694%23id-name%3DS2CID&amp;rft.issn=1554-0669&amp;rft_id=info%3Adoi%2F10.1561%2F1500000011&amp;rft.aulast=Pang&amp;rft.aufirst=Bo&amp;rft.au=Lee%2C+Lillian&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-15"><span class="mw-cite-backlink"><b><a href="#cite_ref-15">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPaltoglouThelwall2012" class="citation journal cs1">Paltoglou, Georgios; Thelwall, Mike (2012-09-01). "Twitter, MySpace, Digg: Unsupervised Sentiment Analysis in Social Media". <i>ACM Transactions on Intelligent Systems and Technology</i>. <b>3</b> (4): 66. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1145%2F2337542.2337551">10.1145/2337542.2337551</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/2157-6904">2157-6904</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:16600444">16600444</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=ACM+Transactions+on+Intelligent+Systems+and+Technology&amp;rft.atitle=Twitter%2C+MySpace%2C+Digg%3A+Unsupervised+Sentiment+Analysis+in+Social+Media&amp;rft.volume=3&amp;rft.issue=4&amp;rft.pages=66&amp;rft.date=2012-09-01&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A16600444%23id-name%3DS2CID&amp;rft.issn=2157-6904&amp;rft_id=info%3Adoi%2F10.1145%2F2337542.2337551&amp;rft.aulast=Paltoglou&amp;rft.aufirst=Georgios&amp;rft.au=Thelwall%2C+Mike&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-16"><span class="mw-cite-backlink"><b><a href="#cite_ref-16">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://alt.qcri.org/semeval2017/task4/">"Sentiment Analysis in Twitter &lt; SemEval-2017 Task 4"</a>. <i>alt.qcri.org</i><span class="reference-accessdate">. 
Retrieved <span class="nowrap">2018-10-02</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=alt.qcri.org&amp;rft.atitle=Sentiment+Analysis+in+Twitter+%3C+SemEval-2017+Task+4&amp;rft_id=http%3A%2F%2Falt.qcri.org%2Fsemeval2017%2Ftask4%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-17"><span class="mw-cite-backlink"><b><a href="#cite_ref-17">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFZanasi2009" class="citation book cs1">Zanasi, Alessandro (2009). "Virtual Weapons for Real Wars: Text Mining for National Security". <i>Proceedings of the International Workshop on Computational Intelligence in Security for Information Systems CISIS'08</i>. Advances in Soft Computing. Vol.&#160;53. p.&#160;53. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1007%2F978-3-540-88181-0_7">10.1007/978-3-540-88181-0_7</a>. 
<a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-3-540-88180-3" title="Special:BookSources/978-3-540-88180-3"><bdi>978-3-540-88180-3</bdi></a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Virtual+Weapons+for+Real+Wars%3A+Text+Mining+for+National+Security&amp;rft.btitle=Proceedings+of+the+International+Workshop+on+Computational+Intelligence+in+Security+for+Information+Systems+CISIS%2708&amp;rft.series=Advances+in+Soft+Computing&amp;rft.pages=53&amp;rft.date=2009&amp;rft_id=info%3Adoi%2F10.1007%2F978-3-540-88181-0_7&amp;rft.isbn=978-3-540-88180-3&amp;rft.aulast=Zanasi&amp;rft.aufirst=Alessandro&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-18"><span class="mw-cite-backlink"><b><a href="#cite_ref-18">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFBadalKundrotasVakser2015" class="citation journal cs1">Badal, Varsha D.; Kundrotas, Petras J.; Vakser, Ilya A. (2015-12-09). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4674139">"Text Mining for Protein Docking"</a>. <i>PLOS Computational Biology</i>. <b>11</b> (12): e1004630. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2015PLSCB..11E4630B">2015PLSCB..11E4630B</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1371%2Fjournal.pcbi.1004630">10.1371/journal.pcbi.1004630</a></span>. 
<a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/1553-7358">1553-7358</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4674139">4674139</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/26650466">26650466</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=PLOS+Computational+Biology&amp;rft.atitle=Text+Mining+for+Protein+Docking&amp;rft.volume=11&amp;rft.issue=12&amp;rft.pages=e1004630&amp;rft.date=2015-12-09&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC4674139%23id-name%3DPMC&amp;rft_id=info%3Abibcode%2F2015PLSCB..11E4630B&amp;rft_id=info%3Apmid%2F26650466&amp;rft_id=info%3Adoi%2F10.1371%2Fjournal.pcbi.1004630&amp;rft.issn=1553-7358&amp;rft.aulast=Badal&amp;rft.aufirst=Varsha+D.&amp;rft.au=Kundrotas%2C+Petras+J.&amp;rft.au=Vakser%2C+Ilya+A.&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC4674139&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-19"><span class="mw-cite-backlink"><b><a href="#cite_ref-19">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCohenHunter2008" class="citation journal cs1">Cohen, K. Bretonnel; Hunter, Lawrence (2008). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2217579">"Getting Started in Text Mining"</a>. <i>PLOS Computational Biology</i>. <b>4</b> (1): e20. 
<a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2008PLSCB...4...20C">2008PLSCB...4...20C</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1371%2Fjournal.pcbi.0040020">10.1371/journal.pcbi.0040020</a></span>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC2217579">2217579</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/18225946">18225946</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=PLOS+Computational+Biology&amp;rft.atitle=Getting+Started+in+Text+Mining&amp;rft.volume=4&amp;rft.issue=1&amp;rft.pages=e20&amp;rft.date=2008&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC2217579%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F18225946&amp;rft_id=info%3Adoi%2F10.1371%2Fjournal.pcbi.0040020&amp;rft_id=info%3Abibcode%2F2008PLSCB...4...20C&amp;rft.aulast=Cohen&amp;rft.aufirst=K.+Bretonnel&amp;rft.au=Hunter%2C+Lawrence&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC2217579&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-20"><span class="mw-cite-backlink"><b><a href="#cite_ref-20">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation journal cs1">Badal, V. 
D; Kundrotas, P. J; Vakser, I. A (2015). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4674139">"Text mining for protein docking"</a>. <i>PLOS Computational Biology</i>. <b>11</b> (12): e1004630. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2015PLSCB..11E4630B">2015PLSCB..11E4630B</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1371%2Fjournal.pcbi.1004630">10.1371/journal.pcbi.1004630</a></span>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4674139">4674139</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/26650466">26650466</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=PLOS+Computational+Biology&amp;rft.atitle=Text+mining+for+protein+docking&amp;rft.volume=11&amp;rft.issue=12&amp;rft.pages=e1004630&amp;rft.date=2015&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC4674139%23id-name%3DPMC&amp;rft_id=info%3Apmid%2F26650466&amp;rft_id=info%3Adoi%2F10.1371%2Fjournal.pcbi.1004630&amp;rft_id=info%3Abibcode%2F2015PLSCB..11E4630B&amp;rft.aulast=Badal&amp;rft.aufirst=V.+D&amp;rft.au=Kundrotas%2C+P.+J&amp;rft.au=Vakser%2C+I.+A&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC4674139&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-21"><span class="mw-cite-backlink"><b><a href="#cite_ref-21">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPapanikolaouPavlopoulosTheodosiouIliopoulos2015" class="citation journal cs1">Papanikolaou, Nikolas; Pavlopoulos, Georgios A.; Theodosiou, Theodosios; Iliopoulos, Ioannis (2015). "Protein–protein interaction predictions using text mining methods". <i>Methods</i>. <b>74</b>: 47–53. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.ymeth.2014.10.026">10.1016/j.ymeth.2014.10.026</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/1046-2023">1046-2023</a>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/25448298">25448298</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Methods&amp;rft.atitle=Protein%E2%80%93protein+interaction+predictions+using+text+mining+methods&amp;rft.volume=74&amp;rft.pages=47-53&amp;rft.date=2015&amp;rft.issn=1046-2023&amp;rft_id=info%3Apmid%2F25448298&amp;rft_id=info%3Adoi%2F10.1016%2Fj.ymeth.2014.10.026&amp;rft.aulast=Papanikolaou&amp;rft.aufirst=Nikolas&amp;rft.au=Pavlopoulos%2C+Georgios+A.&amp;rft.au=Theodosiou%2C+Theodosios&amp;rft.au=Iliopoulos%2C+Ioannis&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-22"><span class="mw-cite-backlink"><b><a href="#cite_ref-22">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFSzklarczykMorrisCookKuhn2016" class="citation journal cs1">Szklarczyk, Damian; Morris, John H; Cook, Helen; Kuhn, Michael; Wyder, Stefan; Simonovic, Milan; Santos, Alberto; Doncheva, Nadezhda T; Roth, Alexander (2016-10-18). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5210637">"The STRING database in 2017: quality-controlled protein–protein association networks, made broadly accessible"</a>. <i>Nucleic Acids Research</i>. <b>45</b> (D1): D362–D368. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1093%2Fnar%2Fgkw937">10.1093/nar/gkw937</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0305-1048">0305-1048</a>. 
<a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5210637">5210637</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/27924014">27924014</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nucleic+Acids+Research&amp;rft.atitle=The+STRING+database+in+2017%3A+quality-controlled+protein%E2%80%93protein+association+networks%2C+made+broadly+accessible&amp;rft.volume=45&amp;rft.issue=D1&amp;rft.pages=D362-D368&amp;rft.date=2016-10-18&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5210637%23id-name%3DPMC&amp;rft.issn=0305-1048&amp;rft_id=info%3Apmid%2F27924014&amp;rft_id=info%3Adoi%2F10.1093%2Fnar%2Fgkw937&amp;rft.aulast=Szklarczyk&amp;rft.aufirst=Damian&amp;rft.au=Morris%2C+John+H&amp;rft.au=Cook%2C+Helen&amp;rft.au=Kuhn%2C+Michael&amp;rft.au=Wyder%2C+Stefan&amp;rft.au=Simonovic%2C+Milan&amp;rft.au=Santos%2C+Alberto&amp;rft.au=Doncheva%2C+Nadezhda+T&amp;rft.au=Roth%2C+Alexander&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5210637&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-23"><span class="mw-cite-backlink"><b><a href="#cite_ref-23">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLiemMuraliSigdelShi2018" class="citation journal cs1">Liem, David A.; Murali, Sanjana; Sigdel, Dibakar; Shi, Yu; Wang, Xuan; Shen, Jiaming; Choi, Howard; Caufield, John H.; Wang, Wei; Ping, Peipei; Han, Jiawei (2018-10-01). 
<a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6230912">"Phrase mining of textual data to analyze extracellular matrix protein patterns across cardiovascular disease"</a>. <i>American Journal of Physiology. Heart and Circulatory Physiology</i>. <b>315</b> (4): H910–H924. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1152%2Fajpheart.00175.2018">10.1152/ajpheart.00175.2018</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/1522-1539">1522-1539</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6230912">6230912</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/29775406">29775406</a>.</cite><span 
title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=American+Journal+of+Physiology.+Heart+and+Circulatory+Physiology&amp;rft.atitle=Phrase+mining+of+textual+data+to+analyze+extracellular+matrix+protein+patterns+across+cardiovascular+disease&amp;rft.volume=315&amp;rft.issue=4&amp;rft.pages=H910-H924&amp;rft.date=2018-10-01&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC6230912%23id-name%3DPMC&amp;rft.issn=1522-1539&amp;rft_id=info%3Apmid%2F29775406&amp;rft_id=info%3Adoi%2F10.1152%2Fajpheart.00175.2018&amp;rft.aulast=Liem&amp;rft.aufirst=David+A.&amp;rft.au=Murali%2C+Sanjana&amp;rft.au=Sigdel%2C+Dibakar&amp;rft.au=Shi%2C+Yu&amp;rft.au=Wang%2C+Xuan&amp;rft.au=Shen%2C+Jiaming&amp;rft.au=Choi%2C+Howard&amp;rft.au=Caufield%2C+John+H.&amp;rft.au=Wang%2C+Wei&amp;rft.au=Ping%2C+Peipei&amp;rft.au=Han%2C+Jiawei&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC6230912&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-24"><span class="mw-cite-backlink"><b><a href="#cite_ref-24">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFVan_LeMontgomeryKirkbyScanlan2018" class="citation journal cs1">Van Le, D; Montgomery, J; Kirkby, KC; Scanlan, J (10 August 2018). <a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.jbi.2018.08.007">"Risk Prediction using Natural Language Processing of Electronic Mental Health Records in an Inpatient Forensic Psychiatry Setting"</a>. <i>Journal of Biomedical Informatics</i>. <b>86</b>: 49–58. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.jbi.2018.08.007">10.1016/j.jbi.2018.08.007</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/30118855">30118855</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Journal+of+Biomedical+Informatics&amp;rft.atitle=Risk+Prediction+using+Natural+Language+Processing+of+Electronic+Mental+Health+Records+in+an+Inpatient+Forensic+Psychiatry+Setting.&amp;rft.volume=86&amp;rft.pages=49-58&amp;rft.date=2018-08-10&amp;rft_id=info%3Adoi%2F10.1016%2Fj.jbi.2018.08.007&amp;rft_id=info%3Apmid%2F30118855&amp;rft.aulast=Van+Le&amp;rft.aufirst=D&amp;rft.au=Montgomery%2C+J&amp;rft.au=Kirkby%2C+KC&amp;rft.au=Scanlan%2C+J&amp;rft_id=https%3A%2F%2Fdoi.org%2F10.1016%252Fj.jbi.2018.08.007&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-25"><span class="mw-cite-backlink"><b><a href="#cite_ref-25">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFJenssenLægreidKomorowskiHovig2001" class="citation journal cs1">Jenssen, Tor-Kristian; Lægreid, Astrid; Komorowski, Jan; Hovig, Eivind (2001). "A literature network of human genes for high-throughput analysis of gene expression". <i>Nature Genetics</i>. <b>28</b> (1): 21–8. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng0501-21">10.1038/ng0501-21</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/11326270">11326270</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:8889284">8889284</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Genetics&amp;rft.atitle=A+literature+network+of+human+genes+for+high-throughput+analysis+of+gene+expression&amp;rft.volume=28&amp;rft.issue=1&amp;rft.pages=21-8&amp;rft.date=2001&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A8889284%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F11326270&amp;rft_id=info%3Adoi%2F10.1038%2Fng0501-21&amp;rft.aulast=Jenssen&amp;rft.aufirst=Tor-Kristian&amp;rft.au=L%C3%A6greid%2C+Astrid&amp;rft.au=Komorowski%2C+Jan&amp;rft.au=Hovig%2C+Eivind&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-26"><span class="mw-cite-backlink"><b><a href="#cite_ref-26">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFMasys2001" class="citation journal cs1">Masys, Daniel R. (2001). "Linking microarray data to the literature". <i>Nature Genetics</i>. <b>28</b> (1): 9–10. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1038%2Fng0501-9">10.1038/ng0501-9</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/11326264">11326264</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:52848745">52848745</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Nature+Genetics&amp;rft.atitle=Linking+microarray+data+to+the+literature&amp;rft.volume=28&amp;rft.issue=1&amp;rft.pages=9-10&amp;rft.date=2001&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A52848745%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F11326264&amp;rft_id=info%3Adoi%2F10.1038%2Fng0501-9&amp;rft.aulast=Masys&amp;rft.aufirst=Daniel+R.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-27"><span class="mw-cite-backlink"><b><a href="#cite_ref-27">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRenganathan2017" class="citation journal cs1">Renganathan, Vinaitheerthan (2017). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5572517">"Text Mining in Biomedical Domain with Emphasis on Document Clustering"</a>. <i>Healthcare Informatics Research</i>. <b>23</b> (3): 141–146. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.4258%2Fhir.2017.23.3.141">10.4258/hir.2017.23.3.141</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/2093-3681">2093-3681</a>. 
<a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5572517">5572517</a></span>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/28875048">28875048</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Healthcare+Informatics+Research&amp;rft.atitle=Text+Mining+in+Biomedical+Domain+with+Emphasis+on+Document+Clustering&amp;rft.volume=23&amp;rft.issue=3&amp;rft.pages=141-146&amp;rft.date=2017&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5572517%23id-name%3DPMC&amp;rft.issn=2093-3681&amp;rft_id=info%3Apmid%2F28875048&amp;rft_id=info%3Adoi%2F10.4258%2Fhir.2017.23.3.141&amp;rft.aulast=Renganathan&amp;rft.aufirst=Vinaitheerthan&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5572517&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-28"><span class="mw-cite-backlink"><b><a href="#cite_ref-28">^</a></b></span> <span class="reference-text"><a rel="nofollow" class="external text" href="http://yatsko.zohosites.com/texor-a-chat-mining-program.html">"Texor: a chat mining program"</a>. <a rel="nofollow" class="external text" href="https://web.archive.org/web/20131004224652/http://yatsko.zohosites.com/texor-a-chat-mining-program.html">Archived</a> October 4, 2013, at the <a href="/wiki/Wayback_Machine" title="Wayback Machine">Wayback Machine</a></span> </li> <li id="cite_note-Text_Analytics:_The_Why_Behind_the_Score-29"><span class="mw-cite-backlink"><b><a href="#cite_ref-Text_Analytics:_The_Why_Behind_the_Score_29-0">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" 
href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.medallia.com/text-analytics/">"Text Analytics"</a>. Medallia<span class="reference-accessdate">. Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Text+Analytics&amp;rft.pub=Medallia&amp;rft_id=http%3A%2F%2Fwww.medallia.com%2Ftext-analytics%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-10.1016/j.im.2008.01.005-30"><span class="mw-cite-backlink">^ <a href="#cite_ref-10.1016/j.im.2008.01.005_30-0"><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-10.1016/j.im.2008.01.005_30-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCoussementVan_Den_Poel2008" class="citation journal cs1">Coussement, Kristof; Van Den Poel, Dirk (2008). <a rel="nofollow" class="external text" href="http://econpapers.repec.org/RePEc:rug:rugwps:08/502">"Integrating the voice of customers through call center emails into a decision support system for churn prediction"</a>. <i>Information &amp; Management</i>. <b>45</b> (3): 164–74. <a href="/wiki/CiteSeerX_(identifier)" class="mw-redirect" title="CiteSeerX (identifier)">CiteSeerX</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.113.3238">10.1.1.113.3238</a></span>. 
<a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.im.2008.01.005">10.1016/j.im.2008.01.005</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Information+%26+Management&amp;rft.atitle=Integrating+the+voice+of+customers+through+call+center+emails+into+a+decision+support+system+for+churn+prediction&amp;rft.volume=45&amp;rft.issue=3&amp;rft.pages=164-74&amp;rft.date=2008&amp;rft_id=https%3A%2F%2Fciteseerx.ist.psu.edu%2Fviewdoc%2Fsummary%3Fdoi%3D10.1.1.113.3238%23id-name%3DCiteSeerX&amp;rft_id=info%3Adoi%2F10.1016%2Fj.im.2008.01.005&amp;rft.aulast=Coussement&amp;rft.aufirst=Kristof&amp;rft.au=Van+Den+Poel%2C+Dirk&amp;rft_id=http%3A%2F%2Feconpapers.repec.org%2FRePEc%3Arug%3Arugwps%3A08%2F502&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-31"><span class="mw-cite-backlink"><b><a href="#cite_ref-31">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation journal cs1">Coussement, Kristof; Van Den Poel, Dirk (2008). <a rel="nofollow" class="external text" href="http://econpapers.repec.org/RePEc:rug:rugwps:07/481">"Improving customer complaint management by automatic email classification using linguistic style features as predictors"</a>. <i>Decision Support Systems</i>. <b>44</b> (4): 870–82. 
<a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.dss.2007.10.010">10.1016/j.dss.2007.10.010</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Decision+Support+Systems&amp;rft.atitle=Improving+customer+complaint+management+by+automatic+email+classification+using+linguistic+style+features+as+predictors&amp;rft.volume=44&amp;rft.issue=4&amp;rft.pages=870-82&amp;rft.date=2008&amp;rft_id=info%3Adoi%2F10.1016%2Fj.dss.2007.10.010&amp;rft.aulast=Coussement&amp;rft.aufirst=Kristof&amp;rft.au=Van+Den+Poel%2C+Dirk&amp;rft_id=http%3A%2F%2Feconpapers.repec.org%2FRePEc%3Arug%3Arugwps%3A07%2F481&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-Galvez2017-32"><span class="mw-cite-backlink"><b><a href="#cite_ref-Galvez2017_32-0">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRamiro_H._GálvezAgustín_Gravano2017" class="citation journal cs1">Ramiro H. Gálvez; Agustín Gravano (2017). "Assessing the usefulness of online message board mining in automatic stock prediction systems". <i>Journal of Computational Science</i>. <b>19</b>: 43–56. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1016%2Fj.jocs.2017.01.001">10.1016/j.jocs.2017.01.001</a>. 
<a href="/wiki/Hdl_(identifier)" class="mw-redirect" title="Hdl (identifier)">hdl</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://hdl.handle.net/11336%2F60065">11336/60065</a></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Journal+of+Computational+Science&amp;rft.atitle=Assessing+the+usefulness+of+online+message+board+mining+in+automatic+stock+prediction+systems&amp;rft.volume=19&amp;rft.pages=43-56&amp;rft.date=2017&amp;rft_id=info%3Ahdl%2F11336%2F60065&amp;rft_id=info%3Adoi%2F10.1016%2Fj.jocs.2017.01.001&amp;rft.au=Ramiro+H.+G%C3%A1lvez&amp;rft.au=Agust%C3%ADn+Gravano&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-33"><span class="mw-cite-backlink"><b><a href="#cite_ref-33">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFPangLeeVaithyanathan2002" class="citation book cs1">Pang, Bo; Lee, Lillian; Vaithyanathan, Shivakumar (2002). "Thumbs up?". <i>Proceedings of the ACL-02 conference on Empirical methods in natural language processing</i>. Vol.&#160;10. pp.&#160;79–86. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.3115%2F1118693.1118704">10.3115/1118693.1118704</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:7105713">7105713</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=bookitem&amp;rft.atitle=Thumbs+up%3F&amp;rft.btitle=Proceedings+of+the+ACL-02+conference+on+Empirical+methods+in+natural+language+processing&amp;rft.pages=79-86&amp;rft.date=2002&amp;rft_id=info%3Adoi%2F10.3115%2F1118693.1118704&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A7105713%23id-name%3DS2CID&amp;rft.aulast=Pang&amp;rft.aufirst=Bo&amp;rft.au=Lee%2C+Lillian&amp;rft.au=Vaithyanathan%2C+Shivakumar&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-34"><span class="mw-cite-backlink"><b><a href="#cite_ref-34">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFAlessandro_ValituttiCarlo_StrapparavaOliviero_Stock2005" class="citation journal cs1">Alessandro Valitutti; Carlo Strapparava; Oliviero Stock (2005). <a rel="nofollow" class="external text" href="http://www.psychnology.org/File/PSYCHNOLOGY_JOURNAL_2_1_VALITUTTI.pdf">"Developing Affective Lexical Resources"</a> <span class="cs1-format">(PDF)</span>. <i>PsychNology Journal</i>. 
<b>2</b> (1): 61–83.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=PsychNology+Journal&amp;rft.atitle=Developing+Affective+Lexical+Resources&amp;rft.volume=2&amp;rft.issue=1&amp;rft.pages=61-83&amp;rft.date=2005&amp;rft.au=Alessandro+Valitutti&amp;rft.au=Carlo+Strapparava&amp;rft.au=Oliviero+Stock&amp;rft_id=http%3A%2F%2Fwww.psychnology.org%2FFile%2FPSYCHNOLOGY_JOURNAL_2_1_VALITUTTI.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-camnet-35"><span class="mw-cite-backlink"><b><a href="#cite_ref-camnet_35-0">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFErik_CambriaRobert_SpeerCatherine_HavasiAmir_Hussain2010" class="citation conference cs1">Erik Cambria; Robert Speer; Catherine Havasi; Amir Hussain (2010). <a rel="nofollow" class="external text" href="http://www.aaai.org/ocs/index.php/FSS/FSS10/paper/download/2216/2617.pdf">"SenticNet: a Publicly Available Semantic Resource for Opinion Mining"</a> <span class="cs1-format">(PDF)</span>. <i>Proceedings of AAAI CSK</i>. 
pp.&#160;14–18.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=conference&amp;rft.atitle=SenticNet%3A+a+Publicly+Available+Semantic+Resource+for+Opinion+Mining&amp;rft.btitle=Proceedings+of+AAAI+CSK&amp;rft.pages=14-18&amp;rft.date=2010&amp;rft.au=Erik+Cambria&amp;rft.au=Robert+Speer&amp;rft.au=Catherine+Havasi&amp;rft.au=Amir+Hussain&amp;rft_id=http%3A%2F%2Fwww.aaai.org%2Focs%2Findex.php%2FFSS%2FFSS10%2Fpaper%2Fdownload%2F2216%2F2617.pdf&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-36"><span class="mw-cite-backlink"><b><a href="#cite_ref-36">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFCalvod&#39;Mello2010" class="citation journal cs1">Calvo, Rafael A; d'Mello, Sidney (2010). "Affect Detection: An Interdisciplinary Review of Models, Methods, and Their Applications". <i>IEEE Transactions on Affective Computing</i>. <b>1</b> (1): 18–37. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1109%2FT-AFFC.2010.1">10.1109/T-AFFC.2010.1</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:753606">753606</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=IEEE+Transactions+on+Affective+Computing&amp;rft.atitle=Affect+Detection%3A+An+Interdisciplinary+Review+of+Models%2C+Methods%2C+and+Their+Applications&amp;rft.volume=1&amp;rft.issue=1&amp;rft.pages=18-37&amp;rft.date=2010&amp;rft_id=info%3Adoi%2F10.1109%2FT-AFFC.2010.1&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A753606%23id-name%3DS2CID&amp;rft.aulast=Calvo&amp;rft.aufirst=Rafael+A&amp;rft.au=d%27Mello%2C+Sidney&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-37"><span class="mw-cite-backlink"><b><a href="#cite_ref-37">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.manchester.ac.uk">"The University of Manchester"</a>. Manchester.ac.uk<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=The+University+of+Manchester&amp;rft.pub=Manchester.ac.uk&amp;rft_id=http%3A%2F%2Fwww.manchester.ac.uk&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-38"><span class="mw-cite-backlink"><b><a href="#cite_ref-38">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20120307231425/http://www-tsujii.is.s.u-tokyo.ac.jp/index.html">"Tsujii Laboratory"</a>. Tsujii.is.s.u-tokyo.ac.jp. Archived from <a rel="nofollow" class="external text" href="http://www-tsujii.is.s.u-tokyo.ac.jp/index.html">the original</a> on 2012-03-07<span class="reference-accessdate">. Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=Tsujii+Laboratory&amp;rft.pub=Tsujii.is.s.u-tokyo.ac.jp&amp;rft_id=http%3A%2F%2Fwww-tsujii.is.s.u-tokyo.ac.jp%2Findex.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-39"><span class="mw-cite-backlink"><b><a href="#cite_ref-39">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://www.u-tokyo.ac.jp/index_e.html">"The University of Tokyo"</a>. UTokyo<span class="reference-accessdate">. 
Retrieved <span class="nowrap">2015-02-23</span></span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=unknown&amp;rft.btitle=The+University+of+Tokyo&amp;rft.pub=UTokyo&amp;rft_id=http%3A%2F%2Fwww.u-tokyo.ac.jp%2Findex_e.html&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-40"><span class="mw-cite-backlink"><b><a href="#cite_ref-40">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFShenXiaoHeShang2018" class="citation book cs1">Shen, Jiaming; Xiao, Jinfeng; He, Xinwei; Shang, Jingbo; Sinha, Saurabh; Han, Jiawei (2018-06-27). <i>Entity Set Search of Scientific Literature: An Unsupervised Ranking Approach</i>. ACM. pp.&#160;565–574. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1145%2F3209978.3210055">10.1145/3209978.3210055</a>. <a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-4503-5657-2" title="Special:BookSources/978-1-4503-5657-2"><bdi>978-1-4503-5657-2</bdi></a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:13748283">13748283</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Abook&amp;rft.genre=book&amp;rft.btitle=Entity+Set+Search+of+Scientific+Literature%3A+An+Unsupervised+Ranking+Approach&amp;rft.pages=565-574&amp;rft.pub=ACM&amp;rft.date=2018-06-27&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A13748283%23id-name%3DS2CID&amp;rft_id=info%3Adoi%2F10.1145%2F3209978.3210055&amp;rft.isbn=978-1-4503-5657-2&amp;rft.aulast=Shen&amp;rft.aufirst=Jiaming&amp;rft.au=Xiao%2C+Jinfeng&amp;rft.au=He%2C+Xinwei&amp;rft.au=Shang%2C+Jingbo&amp;rft.au=Sinha%2C+Saurabh&amp;rft.au=Han%2C+Jiawei&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-41"><span class="mw-cite-backlink"><b><a href="#cite_ref-41">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFWalterRadauerMoehrle2017" class="citation journal cs1">Walter, Lothar; Radauer, Alfred; Moehrle, Martin G. (2017-02-06). "The beauty of brimstone butterfly: novelty of patents identified by near environment analysis based on text mining". <i>Scientometrics</i>. <b>111</b> (1): 103–115. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1007%2Fs11192-017-2267-4">10.1007/s11192-017-2267-4</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0138-9130">0138-9130</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:11174676">11174676</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Scientometrics&amp;rft.atitle=The+beauty+of+brimstone+butterfly%3A+novelty+of+patents+identified+by+near+environment+analysis+based+on+text+mining&amp;rft.volume=111&amp;rft.issue=1&amp;rft.pages=103-115&amp;rft.date=2017-02-06&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A11174676%23id-name%3DS2CID&amp;rft.issn=0138-9130&amp;rft_id=info%3Adoi%2F10.1007%2Fs11192-017-2267-4&amp;rft.aulast=Walter&amp;rft.aufirst=Lothar&amp;rft.au=Radauer%2C+Alfred&amp;rft.au=Moehrle%2C+Martin+G.&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-42"><span class="mw-cite-backlink"><b><a href="#cite_ref-42">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFRollCorreiaBerger-Tal2018" class="citation journal cs1">Roll, Uri; Correia, Ricardo A.; Berger-Tal, Oded (2018-03-10). "Using machine learning to disentangle homonyms in large text corpora". <i>Conservation Biology</i>. <b>32</b> (3): 716–724. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<a rel="nofollow" class="external text" href="https://doi.org/10.1111%2Fcobi.13044">10.1111/cobi.13044</a>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0888-8892">0888-8892</a>. <a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/29086438">29086438</a>. 
<a href="/wiki/S2CID_(identifier)" class="mw-redirect" title="S2CID (identifier)">S2CID</a>&#160;<a rel="nofollow" class="external text" href="https://api.semanticscholar.org/CorpusID:3783779">3783779</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Conservation+Biology&amp;rft.atitle=Using+machine+learning+to+disentangle+homonyms+in+large+text+corpora&amp;rft.volume=32&amp;rft.issue=3&amp;rft.pages=716-724&amp;rft.date=2018-03-10&amp;rft.issn=0888-8892&amp;rft_id=https%3A%2F%2Fapi.semanticscholar.org%2FCorpusID%3A3783779%23id-name%3DS2CID&amp;rft_id=info%3Apmid%2F29086438&amp;rft_id=info%3Adoi%2F10.1111%2Fcobi.13044&amp;rft.aulast=Roll&amp;rft.aufirst=Uri&amp;rft.au=Correia%2C+Ricardo+A.&amp;rft.au=Berger-Tal%2C+Oded&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-ReferenceA-43"><span class="mw-cite-backlink">^ <a href="#cite_ref-ReferenceA_43-0"><sup><i><b>a</b></i></sup></a> <a href="#cite_ref-ReferenceA_43-1"><sup><i><b>b</b></i></sup></a></span> <span class="reference-text">Automated analysis of the US presidential elections using Big Data and network analysis; S Sudhahar, GA Veltri, N Cristianini; Big Data &amp; Society 2 (1), 1-28, 2015</span> </li> <li id="cite_note-44"><span class="mw-cite-backlink"><b><a href="#cite_ref-44">^</a></b></span> <span class="reference-text">Network analysis of narrative content in large corpora; S Sudhahar, G De Fazio, R Franzosi, N Cristianini; Natural Language Engineering, 1-32, 2013</span> </li> <li id="cite_note-45"><span class="mw-cite-backlink"><b><a href="#cite_ref-45">^</a></b></span> <span class="reference-text">Quantitative Narrative Analysis; Roberto Franzosi; Emory University © 2010</span> </li> <li id="cite_note-46"><span class="mw-cite-backlink"><b><a href="#cite_ref-46">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" 
href="mw-data:TemplateStyles:r1238218222"><cite id="CITEREFLansdall-WelfareSudhaharThompsonLewis2017" class="citation journal cs1">Lansdall-Welfare, Thomas; Sudhahar, Saatviga; Thompson, James; Lewis, Justin; Team, FindMyPast Newspaper; Cristianini, Nello (2017-01-09). <a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5278459">"Content analysis of 150 years of British periodicals"</a>. <i>Proceedings of the National Academy of Sciences</i>. <b>114</b> (4): E457–E465. <a href="/wiki/Bibcode_(identifier)" class="mw-redirect" title="Bibcode (identifier)">Bibcode</a>:<a rel="nofollow" class="external text" href="https://ui.adsabs.harvard.edu/abs/2017PNAS..114E.457L">2017PNAS..114E.457L</a>. <a href="/wiki/Doi_(identifier)" class="mw-redirect" title="Doi (identifier)">doi</a>:<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://doi.org/10.1073%2Fpnas.1606380114">10.1073/pnas.1606380114</a></span>. <a href="/wiki/ISSN_(identifier)" class="mw-redirect" title="ISSN (identifier)">ISSN</a>&#160;<a rel="nofollow" class="external text" href="https://search.worldcat.org/issn/0027-8424">0027-8424</a>. <a href="/wiki/PMC_(identifier)" class="mw-redirect" title="PMC (identifier)">PMC</a>&#160;<span class="id-lock-free" title="Freely accessible"><a rel="nofollow" class="external text" href="https://www.ncbi.nlm.nih.gov/pmc/articles/PMC5278459">5278459</a></span>. 
<a href="/wiki/PMID_(identifier)" class="mw-redirect" title="PMID (identifier)">PMID</a>&#160;<a rel="nofollow" class="external text" href="https://pubmed.ncbi.nlm.nih.gov/28069962">28069962</a>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Proceedings+of+the+National+Academy+of+Sciences&amp;rft.atitle=Content+analysis+of+150+years+of+British+periodicals&amp;rft.volume=114&amp;rft.issue=4&amp;rft.pages=E457-E465&amp;rft.date=2017-01-09&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5278459%23id-name%3DPMC&amp;rft_id=info%3Abibcode%2F2017PNAS..114E.457L&amp;rft_id=info%3Apmid%2F28069962&amp;rft_id=info%3Adoi%2F10.1073%2Fpnas.1606380114&amp;rft.issn=0027-8424&amp;rft.aulast=Lansdall-Welfare&amp;rft.aufirst=Thomas&amp;rft.au=Sudhahar%2C+Saatviga&amp;rft.au=Thompson%2C+James&amp;rft.au=Lewis%2C+Justin&amp;rft.au=Team%2C+FindMyPast+Newspaper&amp;rft.au=Cristianini%2C+Nello&amp;rft_id=https%3A%2F%2Fwww.ncbi.nlm.nih.gov%2Fpmc%2Farticles%2FPMC5278459&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-47"><span class="mw-cite-backlink"><b><a href="#cite_ref-47">^</a></b></span> <span class="reference-text">I. Flaounas, M. Turchi, O. Ali, N. Fyson, T. De Bie, N. Mosdell, J. Lewis, N. Cristianini, The Structure of EU Mediasphere, PLoS ONE, Vol. 5(12), pp. 
e14243, 2010.</span> </li> <li id="cite_note-48"><span class="mw-cite-backlink"><b><a href="#cite_ref-48">^</a></b></span> <span class="reference-text">Nowcasting Events from the Social Web with Statistical Learning; V Lampos, N Cristianini; ACM Transactions on Intelligent Systems and Technology (TIST) 3 (4), 72</span> </li> <li id="cite_note-49"><span class="mw-cite-backlink"><b><a href="#cite_ref-49">^</a></b></span> <span class="reference-text">NOAM: news outlets analysis and monitoring system; I Flaounas, O Ali, M Turchi, T Snowsill, F Nicart, T De Bie, N Cristianini; Proc. of the 2011 ACM SIGMOD international conference on Management of data</span> </li> <li id="cite_note-50"><span class="mw-cite-backlink"><b><a href="#cite_ref-50">^</a></b></span> <span class="reference-text">Automatic discovery of patterns in media content, N Cristianini, Combinatorial Pattern Matching, 2-13, 2011</span> </li> <li id="cite_note-51"><span class="mw-cite-backlink"><b><a href="#cite_ref-51">^</a></b></span> <span class="reference-text">I. Flaounas, O. Ali, T. Lansdall-Welfare, T. De Bie, N. Mosdell, J. Lewis, N. Cristianini, Research Methods in the Age of Digital Journalism, Digital Journalism, Routledge, 2012</span> </li> <li id="cite_note-52"><span class="mw-cite-backlink"><b><a href="#cite_ref-52">^</a></b></span> <span class="reference-text">Circadian Mood Variations in Twitter Content; Fabon Dzogang, Stafford Lightman, Nello Cristianini. 
Brain and Neuroscience Advances, 1, 2398212817744501.</span> </li> <li id="cite_note-53"><span class="mw-cite-backlink"><b><a href="#cite_ref-53">^</a></b></span> <span class="reference-text">Effects of the Recession on Public Mood in the UK; T Lansdall-Welfare, V Lampos, N Cristianini; Mining Social Network Dynamics (MSND) session on Social Media Applications</span> </li> <li id="cite_note-54"><span class="mw-cite-backlink"><b><a href="#cite_ref-54">^</a></b></span> <span class="reference-text"><a rel="nofollow" class="external text" href="http://www.out-law.com/en/articles/2014/june/researchers-given-data-mining-right-under-new-uk-copyright-laws/">Researchers given data mining right under new UK copyright laws</a> <a rel="nofollow" class="external text" href="https://web.archive.org/web/20140609020315/http://www.out-law.com/en/articles/2014/june/researchers-given-data-mining-right-under-new-uk-copyright-laws/">Archived</a> June 9, 2014, at the <a href="/wiki/Wayback_Machine" title="Wayback Machine">Wayback Machine</a></span> </li> <li id="cite_note-55"><span class="mw-cite-backlink"><b><a href="#cite_ref-55">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="http://ec.europa.eu/licences-for-europe-dialogue/en/content/about-site">"Licences for Europe – Structured Stakeholder Dialogue 2013"</a>. <i>European Commission</i><span class="reference-accessdate">. 
Retrieved <span class="nowrap">14 November</span> 2014</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=European+Commission&amp;rft.atitle=Licences+for+Europe+%E2%80%93+Structured+Stakeholder+Dialogue+2013&amp;rft_id=http%3A%2F%2Fec.europa.eu%2Flicences-for-europe-dialogue%2Fen%2Fcontent%2Fabout-site&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-56"><span class="mw-cite-backlink"><b><a href="#cite_ref-56">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://web.archive.org/web/20141129021244/http://libereurope.eu/news/text-and-data-mining-its-importance-and-the-need-for-change-in-europe/">"Text and Data Mining:Its importance and the need for change in Europe"</a>. <i><a href="/wiki/Association_of_European_Research_Libraries" title="Association of European Research Libraries">Association of European Research Libraries</a></i>. 2013-04-25. Archived from <a rel="nofollow" class="external text" href="http://libereurope.eu/news/text-and-data-mining-its-importance-and-the-need-for-change-in-europe/">the original</a> on 2014-11-29<span class="reference-accessdate">. 
Retrieved <span class="nowrap">14 November</span> 2014</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Association+of+European+Research+Libraries&amp;rft.atitle=Text+and+Data+Mining%3AIts+importance+and+the+need+for+change+in+Europe&amp;rft.date=2013-04-25&amp;rft_id=http%3A%2F%2Flibereurope.eu%2Fnews%2Ftext-and-data-mining-its-importance-and-the-need-for-change-in-europe%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-57"><span class="mw-cite-backlink"><b><a href="#cite_ref-57">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation news cs1"><a rel="nofollow" class="external text" href="http://www.lexology.com/library/detail.aspx?g=a18c5b92-5a20-4d1d-a098-a3095046a88e">"Judge grants summary judgment in favor of Google Books – a fair use victory"</a>. <i>Lexology</i>. Antonelli Law Ltd. 19 November 2013<span class="reference-accessdate">. 
Retrieved <span class="nowrap">14 November</span> 2014</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=article&amp;rft.jtitle=Lexology&amp;rft.atitle=Judge+grants+summary+judgment+in+favor+of+Google+Books+%E2%80%93+a+fair+use+victory&amp;rft.date=2013-11-19&amp;rft_id=http%3A%2F%2Fwww.lexology.com%2Flibrary%2Fdetail.aspx%3Fg%3Da18c5b92-5a20-4d1d-a098-a3095046a88e&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> <li id="cite_note-58"><span class="mw-cite-backlink"><b><a href="#cite_ref-58">^</a></b></span> <span class="reference-text"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><cite class="citation web cs1"><a rel="nofollow" class="external text" href="https://www.alrc.gov.au/publication/copyright-and-the-digital-economy-dp-79/8-non-consumptive-use/text-and-data-mining/">"Text and data mining"</a>. <i><a href="/wiki/Australian_Law_Reform_Commission" title="Australian Law Reform Commission">Australian Law Reform Commission</a></i>. 4 June 2013<span class="reference-accessdate">. 
Retrieved <span class="nowrap">10 February</span> 2023</span>.</cite><span title="ctx_ver=Z39.88-2004&amp;rft_val_fmt=info%3Aofi%2Ffmt%3Akev%3Amtx%3Ajournal&amp;rft.genre=unknown&amp;rft.jtitle=Australian+Law+Reform+Commission&amp;rft.atitle=Text+and+data+mining&amp;rft.date=2013-06-04&amp;rft_id=https%3A%2F%2Fwww.alrc.gov.au%2Fpublication%2Fcopyright-and-the-digital-economy-dp-79%2F8-non-consumptive-use%2Ftext-and-data-mining%2F&amp;rfr_id=info%3Asid%2Fen.wikipedia.org%3AText+mining" class="Z3988"></span></span> </li> </ol></div></div> <div class="mw-heading mw-heading3"><h3 id="Sources">Sources</h3><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=22" title="Edit section: Sources"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li>Ananiadou, S. and McNaught, J. (Editors) (2006). <i>Text Mining for Biology and Biomedicine</i>. Artech House Books. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-58053-984-5" title="Special:BookSources/978-1-58053-984-5">978-1-58053-984-5</a></li> <li>Bilisoly, R. (2008). <i>Practical Text Mining with Perl</i>. New York: John Wiley &amp; Sons. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-0-470-17643-6" title="Special:BookSources/978-0-470-17643-6">978-0-470-17643-6</a></li> <li>Feldman, R., and Sanger, J. (2006). <i>The Text Mining Handbook</i>. New York: Cambridge University Press. 
<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-0-521-83657-9" title="Special:BookSources/978-0-521-83657-9">978-0-521-83657-9</a></li> <li>Hotho, A., Nürnberger, A. and Paaß, G. (2005). "A brief survey of text mining". In Ldv Forum, Vol. 20(1), pp.&#160;19–62</li> <li>Indurkhya, N., and Damerau, F. (2010). <i>Handbook of Natural Language Processing</i>, 2nd Edition. Boca Raton, FL: CRC Press. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-4200-8592-1" title="Special:BookSources/978-1-4200-8592-1">978-1-4200-8592-1</a></li> <li>Kao, A., and Poteet, S. (Editors). <i>Natural Language Processing and Text Mining</i>. Springer. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/1-84628-175-X" title="Special:BookSources/1-84628-175-X">1-84628-175-X</a></li> <li>Konchady, M. <i>Text Mining Application Programming (Programming Series)</i>. Charles River Media. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/1-58450-460-9" title="Special:BookSources/1-58450-460-9">1-58450-460-9</a></li> <li>Manning, C., and Schütze, H. (1999). <i>Foundations of Statistical Natural Language Processing</i>. Cambridge, MA: MIT Press. 
<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-0-262-13360-9" title="Special:BookSources/978-0-262-13360-9">978-0-262-13360-9</a></li> <li>Miner, G., Elder, J., Hill, T., Nisbet, R., Delen, D. and Fast, A. (2012). <i>Practical Text Mining and Statistical Analysis for Non-structured Text Data Applications</i>. Elsevier Academic Press. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-0-12-386979-1" title="Special:BookSources/978-0-12-386979-1">978-0-12-386979-1</a></li> <li>McKnight, W. (2005). "Building business intelligence: Text data mining in business intelligence". <i>DM Review</i>, 21–22.</li> <li>Srivastava, A., and Sahami, M. (2009). <i>Text Mining: Classification, Clustering, and Applications</i>. Boca Raton, FL: CRC Press. <link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-4200-5940-3" title="Special:BookSources/978-1-4200-5940-3">978-1-4200-5940-3</a></li> <li>Zanasi, A. (Editor) (2007). <i>Text Mining and its Applications to Intelligence, CRM and Knowledge Management</i>. WIT Press. 
<link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1238218222"><a href="/wiki/ISBN_(identifier)" class="mw-redirect" title="ISBN (identifier)">ISBN</a>&#160;<a href="/wiki/Special:BookSources/978-1-84564-131-3" title="Special:BookSources/978-1-84564-131-3">978-1-84564-131-3</a></li></ul> <div class="mw-heading mw-heading2"><h2 id="External_links">External links</h2><span class="mw-editsection"><span class="mw-editsection-bracket">[</span><a href="/w/index.php?title=Text_mining&amp;action=edit&amp;section=23" title="Edit section: External links"><span>edit</span></a><span class="mw-editsection-bracket">]</span></span></div> <ul><li><a rel="nofollow" class="external text" href="http://people.ischool.berkeley.edu/~hearst/text-mining.html">Marti Hearst: What Is Text Mining?</a> (October 2003)</li> <li><a rel="nofollow" class="external text" href="http://projects.ldc.upenn.edu/ace/">Automatic Content Extraction, Linguistic Data Consortium</a> <a rel="nofollow" class="external text" href="https://web.archive.org/web/20130925194420/http://projects.ldc.upenn.edu/ace/">Archived</a> 2013-09-25 at the <a href="/wiki/Wayback_Machine" title="Wayback Machine">Wayback Machine</a></li> <li><a rel="nofollow" class="external text" href="https://web.archive.org/web/20060308054306/http://www.itl.nist.gov/iad/894.01/tests/ace/">Automatic Content Extraction, NIST</a></li></ul> <div class="navbox-styles"><style data-mw-deduplicate="TemplateStyles:r1129693374">.mw-parser-output .hlist dl,.mw-parser-output .hlist ol,.mw-parser-output .hlist ul{margin:0;padding:0}.mw-parser-output .hlist dd,.mw-parser-output .hlist dt,.mw-parser-output .hlist li{margin:0;display:inline}.mw-parser-output .hlist.inline,.mw-parser-output .hlist.inline dl,.mw-parser-output .hlist.inline ol,.mw-parser-output .hlist.inline ul,.mw-parser-output .hlist dl dl,.mw-parser-output .hlist dl ol,.mw-parser-output .hlist dl ul,.mw-parser-output .hlist ol dl,.mw-parser-output .hlist ol 
ol,.mw-parser-output .hlist ol ul,.mw-parser-output .hlist ul dl,.mw-parser-output .hlist ul ol,.mw-parser-output .hlist ul ul{display:inline}.mw-parser-output .hlist .mw-empty-li{display:none}.mw-parser-output .hlist dt::after{content:": "}.mw-parser-output .hlist dd::after,.mw-parser-output .hlist li::after{content:" · ";font-weight:bold}.mw-parser-output .hlist dd:last-child::after,.mw-parser-output .hlist dt:last-child::after,.mw-parser-output .hlist li:last-child::after{content:none}.mw-parser-output .hlist dd dd:first-child::before,.mw-parser-output .hlist dd dt:first-child::before,.mw-parser-output .hlist dd li:first-child::before,.mw-parser-output .hlist dt dd:first-child::before,.mw-parser-output .hlist dt dt:first-child::before,.mw-parser-output .hlist dt li:first-child::before,.mw-parser-output .hlist li dd:first-child::before,.mw-parser-output .hlist li dt:first-child::before,.mw-parser-output .hlist li li:first-child::before{content:" (";font-weight:normal}.mw-parser-output .hlist dd dd:last-child::after,.mw-parser-output .hlist dd dt:last-child::after,.mw-parser-output .hlist dd li:last-child::after,.mw-parser-output .hlist dt dd:last-child::after,.mw-parser-output .hlist dt dt:last-child::after,.mw-parser-output .hlist dt li:last-child::after,.mw-parser-output .hlist li dd:last-child::after,.mw-parser-output .hlist li dt:last-child::after,.mw-parser-output .hlist li li:last-child::after{content:")";font-weight:normal}.mw-parser-output .hlist ol{counter-reset:listitem}.mw-parser-output .hlist ol>li{counter-increment:listitem}.mw-parser-output .hlist ol>li::before{content:" "counter(listitem)"\a0 "}.mw-parser-output .hlist dd ol>li:first-child::before,.mw-parser-output .hlist dt ol>li:first-child::before,.mw-parser-output .hlist li ol>li:first-child::before{content:" ("counter(listitem)"\a0 "}</style><style data-mw-deduplicate="TemplateStyles:r1236075235">.mw-parser-output .navbox{box-sizing:border-box;border:1px solid 
#a2a9b1;width:100%;clear:both;font-size:88%;text-align:center;padding:1px;margin:1em auto 0}.mw-parser-output .navbox .navbox{margin-top:0}.mw-parser-output .navbox+.navbox,.mw-parser-output .navbox+.navbox-styles+.navbox{margin-top:-1px}.mw-parser-output .navbox-inner,.mw-parser-output .navbox-subgroup{width:100%}.mw-parser-output .navbox-group,.mw-parser-output .navbox-title,.mw-parser-output .navbox-abovebelow{padding:0.25em 1em;line-height:1.5em;text-align:center}.mw-parser-output .navbox-group{white-space:nowrap;text-align:right}.mw-parser-output .navbox,.mw-parser-output .navbox-subgroup{background-color:#fdfdfd}.mw-parser-output .navbox-list{line-height:1.5em;border-color:#fdfdfd}.mw-parser-output .navbox-list-with-group{text-align:left;border-left-width:2px;border-left-style:solid}.mw-parser-output tr+tr>.navbox-abovebelow,.mw-parser-output tr+tr>.navbox-group,.mw-parser-output tr+tr>.navbox-image,.mw-parser-output tr+tr>.navbox-list{border-top:2px solid #fdfdfd}.mw-parser-output .navbox-title{background-color:#ccf}.mw-parser-output .navbox-abovebelow,.mw-parser-output .navbox-group,.mw-parser-output .navbox-subgroup .navbox-title{background-color:#ddf}.mw-parser-output .navbox-subgroup .navbox-group,.mw-parser-output .navbox-subgroup .navbox-abovebelow{background-color:#e6e6ff}.mw-parser-output .navbox-even{background-color:#f7f7f7}.mw-parser-output .navbox-odd{background-color:transparent}.mw-parser-output .navbox .hlist td dl,.mw-parser-output .navbox .hlist td ol,.mw-parser-output .navbox .hlist td ul,.mw-parser-output .navbox td.hlist dl,.mw-parser-output .navbox td.hlist ol,.mw-parser-output .navbox td.hlist ul{padding:0.125em 0}.mw-parser-output .navbox .navbar{display:block;font-size:100%}.mw-parser-output .navbox-title .navbar{float:left;text-align:left;margin-right:0.5em}body.skin--responsive .mw-parser-output .navbox-image img{max-width:none!important}@media print{body.ns-0 .mw-parser-output .navbox{display:none!important}}</style></div><div 
role="navigation" class="navbox" aria-labelledby="Natural_language_processing" style="padding:3px"><table class="nowraplinks hlist mw-collapsible autocollapse navbox-inner" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="col" class="navbox-title" colspan="2"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><style data-mw-deduplicate="TemplateStyles:r1239400231">.mw-parser-output .navbar{display:inline;font-size:88%;font-weight:normal}.mw-parser-output .navbar-collapse{float:left;text-align:left}.mw-parser-output .navbar-boxtext{word-spacing:0}.mw-parser-output .navbar ul{display:inline-block;white-space:nowrap;line-height:inherit}.mw-parser-output .navbar-brackets::before{margin-right:-0.125em;content:"[ "}.mw-parser-output .navbar-brackets::after{margin-left:-0.125em;content:" ]"}.mw-parser-output .navbar li{word-spacing:-0.125em}.mw-parser-output .navbar a>span,.mw-parser-output .navbar a>abbr{text-decoration:inherit}.mw-parser-output .navbar-mini abbr{font-variant:small-caps;border-bottom:none;text-decoration:none;cursor:inherit}.mw-parser-output .navbar-ct-full{font-size:114%;margin:0 7em}.mw-parser-output .navbar-ct-mini{font-size:114%;margin:0 4em}html.skin-theme-clientpref-night .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}@media(prefers-color-scheme:dark){html.skin-theme-clientpref-os .mw-parser-output .navbar li a abbr{color:var(--color-base)!important}}@media print{.mw-parser-output .navbar{display:none!important}}</style><div class="navbar plainlinks hlist navbar-mini"><ul><li class="nv-view"><a href="/wiki/Template:Natural_language_processing" title="Template:Natural language processing"><abbr title="View this template">v</abbr></a></li><li class="nv-talk"><a href="/wiki/Template_talk:Natural_language_processing" title="Template talk:Natural language processing"><abbr title="Discuss this template">t</abbr></a></li><li class="nv-edit"><a 
href="/wiki/Special:EditPage/Template:Natural_language_processing" title="Special:EditPage/Template:Natural language processing"><abbr title="Edit this template">e</abbr></a></li></ul></div><div id="Natural_language_processing" style="font-size:114%;margin:0 4em"><a href="/wiki/Natural_language_processing" title="Natural language processing">Natural language processing</a></div></th></tr><tr><th scope="row" class="navbox-group" style="width:1%">General terms</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/AI-complete" title="AI-complete">AI-complete</a></li> <li><a href="/wiki/Bag-of-words_model" title="Bag-of-words model">Bag-of-words</a></li> <li><a href="/wiki/N-gram" title="N-gram">n-gram</a> <ul><li><a href="/wiki/Bigram" title="Bigram">Bigram</a></li> <li><a href="/wiki/Trigram" title="Trigram">Trigram</a></li></ul></li> <li><a href="/wiki/Computational_linguistics" title="Computational linguistics">Computational linguistics</a></li> <li><a href="/wiki/Natural_language_understanding" title="Natural language understanding">Natural language understanding</a></li> <li><a href="/wiki/Stop_word" title="Stop word">Stop words</a></li> <li><a href="/wiki/Text_processing" title="Text processing">Text processing</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a class="mw-selflink selflink">Text analysis</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Argument_mining" title="Argument mining">Argument mining</a></li> <li><a href="/wiki/Collocation_extraction" title="Collocation extraction">Collocation extraction</a></li> <li><a href="/wiki/Concept_mining" title="Concept mining">Concept mining</a></li> <li><a href="/wiki/Coreference#Coreference_resolution" title="Coreference">Coreference resolution</a></li> <li><a 
href="/wiki/Deep_linguistic_processing" title="Deep linguistic processing">Deep linguistic processing</a></li> <li><a href="/wiki/Distant_reading" title="Distant reading">Distant reading</a></li> <li><a href="/wiki/Information_extraction" title="Information extraction">Information extraction</a></li> <li><a href="/wiki/Named-entity_recognition" title="Named-entity recognition">Named-entity recognition</a></li> <li><a href="/wiki/Ontology_learning" title="Ontology learning">Ontology learning</a></li> <li><a href="/wiki/Parsing" title="Parsing">Parsing</a> <ul><li><a href="/wiki/Semantic_parsing" title="Semantic parsing">Semantic parsing</a></li> <li><a href="/wiki/Syntactic_parsing_(computational_linguistics)" title="Syntactic parsing (computational linguistics)">Syntactic parsing</a></li></ul></li> <li><a href="/wiki/Part-of-speech_tagging" title="Part-of-speech tagging">Part-of-speech tagging</a></li> <li><a href="/wiki/Semantic_analysis_(machine_learning)" title="Semantic analysis (machine learning)">Semantic analysis</a></li> <li><a href="/wiki/Semantic_role_labeling" title="Semantic role labeling">Semantic role labeling</a></li> <li><a href="/wiki/Semantic_decomposition_(natural_language_processing)" title="Semantic decomposition (natural language processing)">Semantic decomposition</a></li> <li><a href="/wiki/Semantic_similarity" title="Semantic similarity">Semantic similarity</a></li> <li><a href="/wiki/Sentiment_analysis" title="Sentiment analysis">Sentiment analysis</a></li></ul> <ul><li><a href="/wiki/Terminology_extraction" title="Terminology extraction">Terminology extraction</a></li> <li><a class="mw-selflink selflink">Text mining</a></li> <li><a href="/wiki/Textual_entailment" title="Textual entailment">Textual entailment</a></li> <li><a href="/wiki/Truecasing" title="Truecasing">Truecasing</a></li> <li><a href="/wiki/Word-sense_disambiguation" title="Word-sense disambiguation">Word-sense disambiguation</a></li> <li><a href="/wiki/Word-sense_induction" 
title="Word-sense induction">Word-sense induction</a></li></ul> </div><table class="nowraplinks navbox-subgroup" style="border-spacing:0"><tbody><tr><th id="Text_segmentation" scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Text_segmentation" title="Text segmentation">Text segmentation</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Compound-term_processing" title="Compound-term processing">Compound-term processing</a></li> <li><a href="/wiki/Lemmatisation" class="mw-redirect" title="Lemmatisation">Lemmatisation</a></li> <li><a href="/wiki/Lexical_analysis" title="Lexical analysis">Lexical analysis</a></li> <li><a href="/wiki/Shallow_parsing" title="Shallow parsing">Text chunking</a></li> <li><a href="/wiki/Stemming" title="Stemming">Stemming</a></li> <li><a href="/wiki/Sentence_boundary_disambiguation" title="Sentence boundary disambiguation">Sentence segmentation</a></li> <li><a href="/wiki/Word#Word_boundaries" title="Word">Word segmentation</a></li></ul> </div></td></tr></tbody></table><div> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Automatic_summarization" title="Automatic summarization">Automatic summarization</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Multi-document_summarization" title="Multi-document summarization">Multi-document summarization</a></li> <li><a href="/wiki/Sentence_extraction" title="Sentence extraction">Sentence extraction</a></li> <li><a href="/wiki/Text_simplification" title="Text simplification">Text simplification</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Machine_translation" title="Machine translation">Machine translation</a></th><td class="navbox-list-with-group navbox-list navbox-odd" 
style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Computer-assisted_translation" title="Computer-assisted translation">Computer-assisted</a></li> <li><a href="/wiki/Example-based_machine_translation" title="Example-based machine translation">Example-based</a></li> <li><a href="/wiki/Rule-based_machine_translation" title="Rule-based machine translation">Rule-based</a></li> <li><a href="/wiki/Statistical_machine_translation" title="Statistical machine translation">Statistical</a></li> <li><a href="/wiki/Transfer-based_machine_translation" title="Transfer-based machine translation">Transfer-based</a></li> <li><a href="/wiki/Neural_machine_translation" title="Neural machine translation">Neural</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Distributional_semantics" title="Distributional semantics">Distributional semantics</a> models</th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/BERT_(language_model)" title="BERT (language model)">BERT</a></li> <li><a href="/wiki/Document-term_matrix" title="Document-term matrix">Document-term matrix</a></li> <li><a href="/wiki/Explicit_semantic_analysis" title="Explicit semantic analysis">Explicit semantic analysis</a></li> <li><a href="/wiki/FastText" title="FastText">fastText</a></li> <li><a href="/wiki/GloVe" title="GloVe">GloVe</a></li> <li><a href="/wiki/Language_model" title="Language model">Language model</a> (<a href="/wiki/Large_language_model" title="Large language model">large</a>)</li> <li><a href="/wiki/Latent_semantic_analysis" title="Latent semantic analysis">Latent semantic analysis</a></li> <li><a href="/wiki/Seq2seq" title="Seq2seq">Seq2seq</a></li> <li><a href="/wiki/Word_embedding" title="Word embedding">Word embedding</a></li> <li><a href="/wiki/Word2vec" title="Word2vec">Word2vec</a></li></ul> </div></td></tr><tr><th scope="row" 
class="navbox-group" style="width:1%"><a href="/wiki/Language_resource" title="Language resource">Language resources</a>,<br />datasets and corpora</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"></div><table class="nowraplinks navbox-subgroup" style="border-spacing:0"><tbody><tr><th scope="row" class="navbox-group" style="width:1%">Types and<br />standards</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Corpus_linguistics" title="Corpus linguistics">Corpus linguistics</a></li> <li><a href="/wiki/Lexical_resource" title="Lexical resource">Lexical resource</a></li> <li><a href="/wiki/Linguistic_Linked_Open_Data" title="Linguistic Linked Open Data">Linguistic Linked Open Data</a></li> <li><a href="/wiki/Machine-readable_dictionary" title="Machine-readable dictionary">Machine-readable dictionary</a></li> <li><a href="/wiki/Parallel_text" title="Parallel text">Parallel text</a></li> <li><a href="/wiki/PropBank" title="PropBank">PropBank</a></li> <li><a href="/wiki/Semantic_network" title="Semantic network">Semantic network</a></li> <li><a href="/wiki/Simple_Knowledge_Organization_System" title="Simple Knowledge Organization System">Simple Knowledge Organization System</a></li> <li><a href="/wiki/Speech_corpus" title="Speech corpus">Speech corpus</a></li> <li><a href="/wiki/Text_corpus" title="Text corpus">Text corpus</a></li> <li><a href="/wiki/Thesaurus_(information_retrieval)" title="Thesaurus (information retrieval)">Thesaurus (information retrieval)</a></li> <li><a href="/wiki/Treebank" title="Treebank">Treebank</a></li> <li><a href="/wiki/Universal_Dependencies" title="Universal Dependencies">Universal Dependencies</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Data</th><td class="navbox-list-with-group navbox-list navbox-even" 
style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/BabelNet" title="BabelNet">BabelNet</a></li> <li><a href="/wiki/Bank_of_English" title="Bank of English">Bank of English</a></li> <li><a href="/wiki/DBpedia" title="DBpedia">DBpedia</a></li> <li><a href="/wiki/FrameNet" title="FrameNet">FrameNet</a></li> <li><a href="/wiki/Google_Ngram_Viewer" class="mw-redirect" title="Google Ngram Viewer">Google Ngram Viewer</a></li> <li><a href="/wiki/UBY" title="UBY">UBY</a></li> <li><a href="/wiki/WordNet" title="WordNet">WordNet</a></li> <li><a href="/wiki/Wikidata" title="Wikidata">Wikidata</a></li></ul> </div></td></tr></tbody></table><div></div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Automatic_identification_and_data_capture" title="Automatic identification and data capture">Automatic identification<br />and data capture</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Speech_recognition" title="Speech recognition">Speech recognition</a></li> <li><a href="/wiki/Speech_segmentation" title="Speech segmentation">Speech segmentation</a></li> <li><a href="/wiki/Speech_synthesis" title="Speech synthesis">Speech synthesis</a></li> <li><a href="/wiki/Natural_language_generation" title="Natural language generation">Natural language generation</a></li> <li><a href="/wiki/Optical_character_recognition" title="Optical character recognition">Optical character recognition</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Topic_model" title="Topic model">Topic model</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Document_classification" title="Document classification">Document classification</a></li> <li><a href="/wiki/Latent_Dirichlet_allocation" title="Latent 
Dirichlet allocation">Latent Dirichlet allocation</a></li> <li><a href="/wiki/Pachinko_allocation" title="Pachinko allocation">Pachinko allocation</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Computer-assisted_reviewing" title="Computer-assisted reviewing">Computer-assisted<br />reviewing</a></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Automated_essay_scoring" title="Automated essay scoring">Automated essay scoring</a></li> <li><a href="/wiki/Concordancer" title="Concordancer">Concordancer</a></li> <li><a href="/wiki/Grammar_checker" title="Grammar checker">Grammar checker</a></li> <li><a href="/wiki/Predictive_text" title="Predictive text">Predictive text</a></li> <li><a href="/wiki/Pronunciation_assessment" title="Pronunciation assessment">Pronunciation assessment</a></li> <li><a href="/wiki/Spell_checker" title="Spell checker">Spell checker</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Natural-language_user_interface" title="Natural-language user interface">Natural language<br />user interface</a></th><td class="navbox-list-with-group navbox-list navbox-even" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Chatbot" title="Chatbot">Chatbot</a></li> <li><a href="/wiki/Interactive_fiction" title="Interactive fiction">Interactive fiction</a> (cf. 
<a href="/wiki/Syntax_guessing" class="mw-redirect" title="Syntax guessing">Syntax guessing</a>)</li> <li><a href="/wiki/Question_answering" title="Question answering">Question answering</a></li> <li><a href="/wiki/Virtual_assistant" title="Virtual assistant">Virtual assistant</a></li> <li><a href="/wiki/Voice_user_interface" title="Voice user interface">Voice user interface</a></li></ul> </div></td></tr><tr><th scope="row" class="navbox-group" style="width:1%">Related</th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"> <ul><li><a href="/wiki/Formal_semantics_(natural_language)" title="Formal semantics (natural language)">Formal semantics</a></li> <li><a href="/wiki/Hallucination_(artificial_intelligence)" title="Hallucination (artificial intelligence)">Hallucination</a></li> <li><a href="/wiki/Natural_Language_Toolkit" title="Natural Language Toolkit">Natural Language Toolkit</a></li> <li><a href="/wiki/SpaCy" title="SpaCy">spaCy</a></li></ul> </div></td></tr></tbody></table></div> <!-- Authority-control navbox: one header cell plus a list of external links to national authority database records (Japan, Latvia, Israel). The navigation landmark is named after its visible header so assistive technology can tell it apart from the other navbox on the page. --> <div class="navbox-styles"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1129693374"><link rel="mw-deduplicated-inline-style" href="mw-data:TemplateStyles:r1236075235"></div><div role="navigation" class="navbox authority-control" aria-label="Authority control databases" style="padding:3px"><table class="nowraplinks hlist navbox-inner" style="border-spacing:0;background:transparent;color:inherit"><tbody><tr><th scope="row" class="navbox-group" style="width:1%"><a href="/wiki/Help:Authority_control" title="Help:Authority control">Authority control databases</a>: National <span class="mw-valign-text-top noprint" typeof="mw:File/Frameless"><a href="https://www.wikidata.org/wiki/Q676880#identifiers" title="Edit this at Wikidata"><img alt="Edit this at Wikidata" src="//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/10px-OOjs_UI_icon_edit-ltr-progressive.svg.png" decoding="async" 
width="10" height="10" class="mw-file-element" srcset="//upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/15px-OOjs_UI_icon_edit-ltr-progressive.svg.png 1.5x, //upload.wikimedia.org/wikipedia/en/thumb/8/8a/OOjs_UI_icon_edit-ltr-progressive.svg/20px-OOjs_UI_icon_edit-ltr-progressive.svg.png 2x" data-file-width="20" data-file-height="20" /></a></span></th><td class="navbox-list-with-group navbox-list navbox-odd" style="width:100%;padding:0"><div style="padding:0 0.25em"><ul><li><span class="uid"><a rel="nofollow" class="external text" href="https://id.ndl.go.jp/auth/ndlna/01119322">Japan</a></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="https://kopkatalogs.lv/F?func=direct&amp;local_base=lnc10&amp;doc_number=000352119&amp;P_CON_LNG=ENG">Latvia</a></span></li><li><span class="uid"><a rel="nofollow" class="external text" href="http://olduli.nli.org.il/F/?func=find-b&amp;local_base=NLX10&amp;find_code=UID&amp;request=987008756687405171">Israel</a></span></li></ul></div></td></tr></tbody></table></div> <!-- NewPP limit report Parsed by mw‐web.codfw.main‐f69cdc8f6‐c2jr9 Cached time: 20241122141409 Cache expiry: 2592000 Reduced expiry: false Complications: [vary‐revision‐sha1, show‐toc] CPU time usage: 0.760 seconds Real time usage: 0.907 seconds Preprocessor visited node count: 5320/1000000 Post‐expand include size: 135581/2097152 bytes Template argument size: 2716/2097152 bytes Highest expansion depth: 14/100 Expensive parser function count: 5/500 Unstrip recursion depth: 1/20 Unstrip post‐expand size: 204722/5000000 bytes Lua time usage: 0.431/10.000 seconds Lua memory usage: 6102482/52428800 bytes Number of Wikibase entities loaded: 1/400 --> <!-- Transclusion expansion time report (%,ms,calls,template) 100.00% 730.514 1 -total 50.02% 365.418 1 Template:Reflist 18.66% 136.348 23 Template:Cite_journal 16.76% 122.418 11 Template:Cite_web 13.02% 95.137 1 Template:Natural_Language_Processing 12.89% 94.156 3 
Template:Navbox 9.51% 69.459 1 Template:Short_description 9.13% 66.706 10 Template:ISBN 5.88% 42.941 2 Template:Pagetype 5.41% 39.500 10 Template:Catalog_lookup_link --> <!-- Saved in parser cache with key enwiki:pcache:idhash:318439-0!canonical and timestamp 20241122141409 and revision id 1251100761. Rendering was triggered because: page-view --> </div><!--esi <esi:include src="/esitest-fa8a495983347898/content" /> --><noscript><img src="https://login.wikimedia.org/wiki/Special:CentralAutoLogin/start?type=1x1" alt="" width="1" height="1" style="border: none; position: absolute;"></noscript> <div class="printfooter" data-nosnippet="">Retrieved from "<a dir="ltr" href="https://en.wikipedia.org/w/index.php?title=Text_mining&amp;oldid=1251100761">https://en.wikipedia.org/w/index.php?title=Text_mining&amp;oldid=1251100761</a>"</div></div> <div id="catlinks" class="catlinks" data-mw="interface"><div id="mw-normal-catlinks" class="mw-normal-catlinks"><a href="/wiki/Help:Category" title="Help:Category">Categories</a>: <ul><li><a href="/wiki/Category:Text_mining" title="Category:Text mining">Text mining</a></li><li><a href="/wiki/Category:Applied_data_mining" title="Category:Applied data mining">Applied data mining</a></li><li><a href="/wiki/Category:Computational_linguistics" title="Category:Computational linguistics">Computational linguistics</a></li><li><a href="/wiki/Category:Natural_language_processing" title="Category:Natural language processing">Natural language processing</a></li><li><a href="/wiki/Category:Statistical_natural_language_processing" title="Category:Statistical natural language processing">Statistical natural language processing</a></li><li><a href="/wiki/Category:Text" title="Category:Text">Text</a></li></ul></div><div id="mw-hidden-catlinks" class="mw-hidden-catlinks mw-hidden-cats-hidden">Hidden categories: <ul><li><a href="/wiki/Category:Webarchive_template_wayback_links" title="Category:Webarchive template wayback links">Webarchive template 
wayback links</a></li><li><a href="/wiki/Category:CS1_Portuguese-language_sources_(pt)" title="Category:CS1 Portuguese-language sources (pt)">CS1 Portuguese-language sources (pt)</a></li><li><a href="/wiki/Category:Articles_with_short_description" title="Category:Articles with short description">Articles with short description</a></li><li><a href="/wiki/Category:Short_description_matches_Wikidata" title="Category:Short description matches Wikidata">Short description matches Wikidata</a></li><li><a href="/wiki/Category:All_articles_with_unsourced_statements" title="Category:All articles with unsourced statements">All articles with unsourced statements</a></li><li><a href="/wiki/Category:Articles_with_unsourced_statements_from_October_2022" title="Category:Articles with unsourced statements from October 2022">Articles with unsourced statements from October 2022</a></li></ul></div></div> </div> </main> </div> <div class="mw-footer-container"> <footer id="footer" class="mw-footer" > <ul id="footer-info"> <li id="footer-info-lastmod"> This page was last edited on 14 October 2024, at 12:01<span class="anonymous-show">&#160;(UTC)</span>.</li> <li id="footer-info-copyright">Text is available under the <a href="/wiki/Wikipedia:Text_of_the_Creative_Commons_Attribution-ShareAlike_4.0_International_License" title="Wikipedia:Text of the Creative Commons Attribution-ShareAlike 4.0 International License">Creative Commons Attribution-ShareAlike 4.0 License</a>; additional terms may apply. By using this site, you agree to the <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Terms_of_Use" class="extiw" title="foundation:Special:MyLanguage/Policy:Terms of Use">Terms of Use</a> and <a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy" class="extiw" title="foundation:Special:MyLanguage/Policy:Privacy policy">Privacy Policy</a>. 
Wikipedia® is a registered trademark of the <a rel="nofollow" class="external text" href="https://wikimediafoundation.org/">Wikimedia Foundation, Inc.</a>, a non-profit organization.</li> </ul> <ul id="footer-places"> <li id="footer-places-privacy"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Privacy_policy">Privacy policy</a></li> <li id="footer-places-about"><a href="/wiki/Wikipedia:About">About Wikipedia</a></li> <li id="footer-places-disclaimers"><a href="/wiki/Wikipedia:General_disclaimer">Disclaimers</a></li> <li id="footer-places-contact"><a href="//en.wikipedia.org/wiki/Wikipedia:Contact_us">Contact Wikipedia</a></li> <li id="footer-places-wm-codeofconduct"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Universal_Code_of_Conduct">Code of Conduct</a></li> <li id="footer-places-developers"><a href="https://developer.wikimedia.org">Developers</a></li> <li id="footer-places-statslink"><a href="https://stats.wikimedia.org/#/en.wikipedia.org">Statistics</a></li> <li id="footer-places-cookiestatement"><a href="https://foundation.wikimedia.org/wiki/Special:MyLanguage/Policy:Cookie_statement">Cookie statement</a></li> <li id="footer-places-mobileview"><a href="//en.m.wikipedia.org/w/index.php?title=Text_mining&amp;mobileaction=toggle_view_mobile" class="noprint stopMobileRedirectToggle">Mobile view</a></li> </ul> <ul id="footer-icons" class="noprint"> <li id="footer-copyrightico"><a href="https://wikimediafoundation.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/static/images/footer/wikimedia-button.svg" width="84" height="29" alt="Wikimedia Foundation" loading="lazy"></a></li> <li id="footer-poweredbyico"><a href="https://www.mediawiki.org/" class="cdx-button cdx-button--fake-button cdx-button--size-large cdx-button--fake-button--enabled"><img src="/w/resources/assets/poweredby_mediawiki.svg" alt="Powered by MediaWiki" width="88" height="31" 
loading="lazy"></a></li> </ul> </footer> </div> </div> </div> <div class="vector-settings" id="p-dock-bottom"> <ul></ul> </div><script>(RLQ=window.RLQ||[]).push(function(){mw.config.set({"wgHostname":"mw-web.codfw.main-f69cdc8f6-zntss","wgBackendResponseTime":167,"wgPageParseReport":{"limitreport":{"cputime":"0.760","walltime":"0.907","ppvisitednodes":{"value":5320,"limit":1000000},"postexpandincludesize":{"value":135581,"limit":2097152},"templateargumentsize":{"value":2716,"limit":2097152},"expansiondepth":{"value":14,"limit":100},"expensivefunctioncount":{"value":5,"limit":500},"unstrip-depth":{"value":1,"limit":20},"unstrip-size":{"value":204722,"limit":5000000},"entityaccesscount":{"value":1,"limit":400},"timingprofile":["100.00% 730.514 1 -total"," 50.02% 365.418 1 Template:Reflist"," 18.66% 136.348 23 Template:Cite_journal"," 16.76% 122.418 11 Template:Cite_web"," 13.02% 95.137 1 Template:Natural_Language_Processing"," 12.89% 94.156 3 Template:Navbox"," 9.51% 69.459 1 Template:Short_description"," 9.13% 66.706 10 Template:ISBN"," 5.88% 42.941 2 Template:Pagetype"," 5.41% 39.500 10 Template:Catalog_lookup_link"]},"scribunto":{"limitreport-timeusage":{"value":"0.431","limit":"10.000"},"limitreport-memusage":{"value":6102482,"limit":52428800}},"cachereport":{"origin":"mw-web.codfw.main-f69cdc8f6-c2jr9","timestamp":"20241122141409","ttl":2592000,"transientcontent":false}}});});</script> <script type="application/ld+json">{"@context":"https:\/\/schema.org","@type":"Article","name":"Text mining","url":"https:\/\/en.wikipedia.org\/wiki\/Text_mining","sameAs":"http:\/\/www.wikidata.org\/entity\/Q676880","mainEntity":"http:\/\/www.wikidata.org\/entity\/Q676880","author":{"@type":"Organization","name":"Contributors to Wikimedia projects"},"publisher":{"@type":"Organization","name":"Wikimedia Foundation, 
Inc.","logo":{"@type":"ImageObject","url":"https:\/\/www.wikimedia.org\/static\/images\/wmf-hor-googpub.png"}},"datePublished":"2003-09-14T18:19:41Z","dateModified":"2024-10-14T12:01:01Z","headline":"process of analysing text to extract information from it"}</script> </body> </html>

Pages: 1 2 3 4 5 6 7 8 9 10