CINXE.COM

Information Retrieval - Ryte Wiki - The Digital Marketing Wiki

<!DOCTYPE html> <html class="client-nojs" lang="en" dir="ltr"> <head> <meta charset="UTF-8"/> <title>Information Retrieval - Ryte Wiki - The Digital Marketing Wiki</title> <script>document.documentElement.className="client-js";RLCONF={"wgBreakFrames":!1,"wgSeparatorTransformTable":["",""],"wgDigitTransformTable":["",""],"wgDefaultDateFormat":"dmy","wgMonthNames":["","January","February","March","April","May","June","July","August","September","October","November","December"],"wgRequestId":"93deff5e658771e1b1ffcbd9","wgCSPNonce":!1,"wgCanonicalNamespace":"","wgCanonicalSpecialPageName":!1,"wgNamespaceNumber":0,"wgPageName":"Information_Retrieval","wgTitle":"Information Retrieval","wgCurRevisionId":3021,"wgRevisionId":3021,"wgArticleId":481,"wgIsArticle":!0,"wgIsRedirect":!1,"wgAction":"view","wgUserName":null,"wgUserGroups":["*"],"wgCategories":["Search Engine Optimization"],"wgPageContentLanguage":"en","wgPageContentModel":"wikitext","wgRelevantPageName":"Information_Retrieval","wgRelevantArticleId":481,"wgIsProbablyEditable":!1,"wgRelevantPageIsProbablyEditable":!1,"wgRestrictionEdit":[],"wgRestrictionMove":[],"wgVisualEditor":{ "pageLanguageCode":"en","pageLanguageDir":"ltr","pageVariantFallbacks":"en"},"wgRelatedArticles":["Google 
Inc."],"wgFlaggedRevsParams":{"tags":{"accuracy":{"levels":1,"quality":1,"pristine":2}}},"wgStableRevisionId":3021,"bsgMaxUploadSize":{"php":536870912,"mediawiki":104857600},"bsgEnableUploads":!0,"bsgFileExtensions":["txt","rtf","doc","dot","docx","dotx","dotm","xls","xlt","xlm","xlsx","xlsm","xltm","xltx","ppt","pot","pps","pptx","pptm","potx","potm","ppsx","ppsm","sldx","sldm","odt","fodt","ods","fods","odp","fodp","pdf","zip","rar","tar","tgz","gz","bzip2","7zip","xml","svg"],"bsgImageExtensions":["png","gif","jpg","jpeg"],"bsgIsWindows":!1,"bsgArticlePreviewCaptureNotDefault":!1,"bsMaxUploadSize":{"php":536870912,"mediawiki":104857600},"bsEnableUploads":!0,"bsFileExtensions":["txt","rtf","doc","dot","docx","dotx","dotm","xls","xlt","xlm","xlsx","xlsm","xltm","xltx","ppt","pot","pps","pptx","pptm","potx","potm","ppsx","ppsm","sldx","sldm","odt","fodt","ods","fods", "odp","fodp","pdf","zip","rar","tar","tgz","gz","bzip2","7zip","xml","svg"],"bsImageExtensions":["png","gif","jpg","jpeg"],"bsIsWindows":!1,"bsArticlePreviewCaptureNotDefault":!1,"wgEditSubmitButtonLabelPublish":!1,"bsgDeferredNotifications":[]};RLSTATE={"site.styles":"ready","noscript":"ready","user.styles":"ready","user":"ready","user.options":"loading","ext.flaggedRevs.icons":"ready","oojs-ui-core.styles":"ready","oojs-ui.styles.indicators":"ready","mediawiki.widgets.styles":"ready","oojs-ui-core.icons":"ready","mediawiki.toc.styles":"ready","ext.bluespice.styles":"ready","ext.bluespice.compat.vector.styles":"ready","ext.visualEditor.desktopArticleTarget.noscript":"ready","ext.flaggedRevs.basic":"ready","bluespice.flaggedRevsConnector.styles":"ready","skin.ryte.styles":"ready"};RLPAGEMODULES=["site","mediawiki.page.startup","mediawiki.page.ready","mediawiki.toc","ext.bluespice","ext.visualEditor.desktopArticleTarget.init","ext.visualEditor.targetLoader", 
"ext.relatedArticles.readMore.bootstrap","ext.flaggedRevs.advanced","bluespice.flaggedRevsConnector.js","skin.ryte.scripts","ext.bootstrap.scripts"];</script> <script>(RLQ=window.RLQ||[]).push(function(){mw.loader.implement("user.options@1hzgi",function($,jQuery,require,module){/*@nomin*/mw.user.tokens.set({"patrolToken":"+\\","watchToken":"+\\","csrfToken":"+\\"}); });});</script> <link rel="stylesheet" href="/wiki/load.php?lang=en&amp;modules=bluespice.flaggedRevsConnector.styles%7Cext.bluespice.compat.vector.styles%7Cext.bluespice.styles%7Cext.flaggedRevs.basic%2Cicons%7Cext.visualEditor.desktopArticleTarget.noscript%7Cmediawiki.toc.styles%7Cmediawiki.widgets.styles%7Coojs-ui-core.icons%2Cstyles%7Coojs-ui.styles.indicators%7Cskin.ryte.styles&amp;only=styles&amp;skin=ryteskin"/> <script async="" src="/wiki/load.php?lang=en&amp;modules=startup&amp;only=scripts&amp;raw=1&amp;skin=ryteskin"></script> <meta name="ResourceLoaderDynamicStyles" content=""/> <link rel="stylesheet" href="/wiki/load.php?lang=en&amp;modules=site.styles&amp;only=styles&amp;skin=ryteskin"/> <meta name="generator" content="MediaWiki 1.35.2"/> <meta name="viewport" content="width=device-width, initial-scale=1.0"/> <link rel="alternate" hreflang="de" href="https://de.ryte.com/wiki/Information_Retrieval"/> <link rel="alternate" hreflang="en" href="https://en.ryte.com/wiki/Information_Retrieval"/> <link rel="apple-touch-icon" href="/wiki/skins/RyteSkin/resources/images/favicon-32x32.png"/> <link rel="shortcut icon" href="/wiki/extensions/BlueSpiceFoundation/resources/bluespice/images/favicon.ico"/> <link rel="search" type="application/opensearchdescription+xml" href="/wiki/opensearch_desc.php" title="Ryte Wiki - The Digital Marketing Wiki (en)"/> <link rel="EditURI" type="application/rsd+xml" href="https://en.ryte.com/wiki/api.php?action=rsd"/> <link rel="canonical" href="https://en.ryte.com/wiki/Information_Retrieval"/> <script id="usercentrics-cmp" data-settings-id="iYESBWoLK" 
src="https://app.usercentrics.eu/browser-ui/latest/bundle.js" async=""></script> <!--[if lt IE 9]><script src="/wiki/resources/lib/html5shiv/html5shiv.js"></script><![endif]--> </head> <body class="mediawiki ltr sitedir-ltr mw-hide-empty-elt ns-0 ns-subject page-Information_Retrieval rootpage-Information_Retrieval layout-ryte skin-ryteskin action-view bs-contentpage"><div id="topmenu"><div><a id="logo" href="/wiki/Main_Page"><img src="/wiki/skins/RyteSkin/resources/images/Ryte_Logo_Wiki.svg" alt="Ryte Wiki"/></a><ul class="navi"><li><form id="searchform2" action="https://en.ryte.com/wiki/Special:Search" class="searchform" role="search"><input id ="searchInput" name="search" placeholder="Search" accesskey="f" type="search" autocomplete="off" maxlength="50" ><input id="mw-searchButton" class="searchsubmit" name="fulltext" type="submit" value=""/></form></li><li class="dropdown_menu bs-dropdown-hover dropdown"><a class="dropdown-toggle" data-toggle="dropdown">Categories<svg xmlns="http://www.w3.org/2000/svg" width="14" height="14" viewbox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round"><polyline points="6 9 12 15 18 9"></polyline></svg></a><div class="dropdown-menu"><a href="https://en.ryte.com/wiki/Category:Online_Marketing">Online Marketing</a><a href="https://en.ryte.com/wiki/Category:Search_Engine_Optimization">Search Engine Optimization</a><a href="https://en.ryte.com/wiki/Category:Social_Media">Social Media</a><a href="https://en.ryte.com/wiki/Category:Usability">Usability</a><a href="https://en.ryte.com/wiki/Category:Mobile_Marketing">Mobile Marketing</a><a href="https://en.ryte.com/wiki/Category:Web_Analysis">Web Analysis</a><a href="https://en.ryte.com/wiki/Category:Development">Development</a></div></li><li class=""><a href="/">ryte.com</a></li></ul><div class="nav_mobile"><svg class="open_menu" version="1.1" xmlns="http://www.w3.org/2000/svg" width="20" height="16" viewbox="0 0 16 16"><rect 
class="st0 topmenu-svg-btn" width="20" height="2"></rect><rect y="6" class="st0 topmenu-svg-btn" width="20" height="2"></rect><rect y="12" class="st0 topmenu-svg-btn" width="20" height="2"></rect></svg><svg class="close_menu" xmlns="http://www.w3.org/2000/svg" width="20" height="16" viewbox="0 0 20 16"><polygon class="st0 topmenu-svg-btn" points="15.6 1.4 14.1 0 7.8 6.4 1.4 0 0 1.4 6.4 7.8 0 14.1 1.4 15.6 7.8 9.2 14.1 15.6 15.6 14.1 9.2 7.8 15.6 1.4"></polygon></svg></div></div></div><div id="inletaside_wrapper" class="_bg_gray inletasidewrapper"><aside id="aside"><h2 class="bs-sidebar-section" style="display: block">Page approval</h2><div class="frc-cnt stable" data-state="stable" data-user-can-review="false"><span class="frc-state">State: Approved</span></div><h2 class="bs-sidebar-section">Main page</h2><ul><li><a href="https://en.ryte.com/wiki/Main_Page">Homepage</a></li></ul><h2 class="bs-sidebar-section">Contact</h2><ul><li><a href="mailto:editorial@ryte.com">See a topic that's missing? 
<br >Send us an email!</a></li></ul><h2 class="bs-sidebar-section">Learn more</h2><ul><li><a href="https://en.ryte.com/magazine/">Discover the Ryte Magazine</a></li></ul><h2 class="bs-sidebar-section">Other languages</h2><ul><li><a href="https://de.ryte.com/wiki/Information_Retrieval">Deutsch</a></li></ul><form id="newslform" class="newsl_form" action="https://en.ryte.com/register/free-trial/" method="post" style="visibility: visible;"><div><p class="wikiheads">Optimize your website with Ryte!</p><input id ="website" name="prefilled_url" placeholder="http://" type="text" required="required" ><input type="submit" name="submit" class="button green_bt" value="Start your free trial"/></div></form></aside><div class="_inlet"><div class="_spacer"><div id="content" class="mw-body" role="main"><div id="siteNotice"><div id="mwstake-alert-container"><div class="alert alert-success" role="alert" data-mwstake-alert-id="bs-flaggedrevsconnector-revisionstate">This version is approved.</div></div></div><h1 id="firstHeading" class="firstHeading">Information Retrieval</h1><div id="mw-page-header-links"></div><div class="visualClear"></div><div id="bodyContent" class="mw-body-content"><div class="skyscraper"><div class="sidebox" id="sidebox"><div class="newsocials sideboxsocials center"><div class="share_wrap clear"><a class="bt_share share_fb" href="http://www.facebook.com/sharer.php?u=https://en.ryte.com/wiki/Information_Retrieval">share</a><a class="bt_share share_tw" href="http://twitter.com/intent/tweet?related=Ryte&amp;text=&amp;url=https://en.ryte.com/wiki/Information_Retrieval&amp;via=Ryte_DE&amp;lang=de">tweet</a><a class="bt_share share_li" href="https://www.linkedin.com/shareArticle?mini=true&amp;url=https://en.ryte.com/wiki/Information_Retrieval&amp;title=">share</a></div></div></div></div><div id="contentSub"></div><div></div><div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr"><div class="mw-parser-output"><p><br /> In information retrieval, 
unstructured data is evaluated similar to what search engines do with the World Wide Web. </p> <div id="toc" class="toc" role="navigation" aria-labelledby="mw-toc-heading"><input type="checkbox" role="button" id="toctogglecheckbox" class="toctogglecheckbox" style="display:none" /><div class="toctitle" lang="en" dir="ltr"><h2 id="mw-toc-heading">Contents</h2><span class="toctogglespan"><label class="toctogglelabel" for="toctogglecheckbox"></label></span></div> <ul> <li class="toclevel-1 tocsection-1"><a href="#Main_principle"><span class="tocnumber">1</span> <span class="toctext">Main principle</span></a></li> <li class="toclevel-1 tocsection-2"><a href="#Areas_of_application"><span class="tocnumber">2</span> <span class="toctext">Areas of application</span></a></li> <li class="toclevel-1 tocsection-3"><a href="#Difficulties"><span class="tocnumber">3</span> <span class="toctext">Difficulties</span></a></li> <li class="toclevel-1 tocsection-4"><a href="#Models"><span class="tocnumber">4</span> <span class="toctext">Models</span></a> <ul> <li class="toclevel-2 tocsection-5"><a href="#Boolean_model"><span class="tocnumber">4.1</span> <span class="toctext">Boolean model</span></a></li> <li class="toclevel-2 tocsection-6"><a href="#Vector_space_model"><span class="tocnumber">4.2</span> <span class="toctext">Vector space model</span></a></li> <li class="toclevel-2 tocsection-7"><a href="#Probabilistic_model"><span class="tocnumber">4.3</span> <span class="toctext">Probabilistic model</span></a></li> </ul> </li> </ul> </div> <h2><span class="mw-headline" id="Main_principle">Main principle</span></h2> <p>It is based on a large amount of data. For example, information about a particular topic needs to be found. For this purpose, the amount of data needs to be searched and the data found must be assessed as to whether it is important information and if certain information is more important than other information found. 
There is no clear answer for all this and there is no perfect order for the data to be delivered as a result. The evaluation of the data is supposed to be useful for humans. It’s not about recreating data, but managing existing data. Large amounts of data are searched for, not individual words. </p> <h2><span class="mw-headline" id="Areas_of_application">Areas of application</span></h2> <p>Currently, the largest area of application is Internet search, whereby search engines such as <a href="/wiki/Google_Inc." title="Google Inc." data-bs-title="Google_Inc.">Google</a> or <a href="/wiki/Bing" title="Bing" data-bs-title="Bing">Bing</a> search the data of the Internet based on desired words (search requests). The searcher is provided a results list of relevant webpages which contain information with regard to the entered search term. Search results that are not relevant to the user, but still appear on the <a href="/wiki/SERP" title="SERP" data-bs-title="SERP">SERPs</a> are called false drops. Moreover, information retrieval is used when searching for literature in digital libraries, in image search engines, and spam filters. </p> <h2><span class="mw-headline" id="Difficulties">Difficulties</span></h2> <p>Users can usually only enter very vague requests. They often also do not know exactly what they are looking for. It is also uncertain if the information is correct, for example, because a word has different meanings or there are synonyms that mean the same thing. </p> <h2><span class="mw-headline" id="Models">Models</span></h2> <p>There are different models for <a href="/wiki/Indexing" title="Indexing" data-bs-title="Indexing">indexing</a> of found documents which do not exclude each other as a rule. The aim is to present many relevant documents and to omit those which are not relevant. 
</p> <h3><span class="mw-headline" id="Boolean_model">Boolean model</span></h3> <p>Based on Boolean algebra, requests with exact syntax are posed with Boolean operators such as "and", "or", "not" etc. This is quite easy and clear. The disadvantage is that partial results and weighting of terms are not possible. Thus, the result is not a ranking, because a document is either relevant or not. </p> <h3><span class="mw-headline" id="Vector_space_model">Vector space model</span></h3> <p>A model often used by search engines is the vector space model, since it takes both ranking and similarity search into account. A document is transformed into a vector and in this format can be compared to other documents or the search request. The vectors can be sorted according to their similarity to the search request. The downside of this model is that Boolean operators cannot be used and terms cannot be excluded. Terms, term frequency, and IDF are used in this model. The location of the documents in the vector space is calculated through these. </p> <h3><span class="mw-headline" id="Probabilistic_model">Probabilistic model</span></h3> <p>This model specifies a probability value for each document to determine whether it is a relevant result. In this case, the number of occurrences of the search terms in the document is critical. The result is a list that is sorted according to the probabilities. This model is no better than others and is hardly used in practice. 
</p> <!-- NewPP limit report Cached time: 20250217122125 Cache expiry: 86400 Dynamic content: false Complications: [] CPU time usage: 0.003 seconds Real time usage: 0.006 seconds Preprocessor visited node count: 26/1000000 Post‐expand include size: 0/2097152 bytes Template argument size: 0/2097152 bytes Highest expansion depth: 2/40 Expensive parser function count: 0/100 Unstrip recursion depth: 0/20 Unstrip post‐expand size: 0/5000000 bytes --> <!-- Transclusion expansion time report (%,ms,calls,template) 100.00% 0.000 1 -total --> </div><div class="loader-indicator global loading"><div class="loader-indicator-inner"></div></div></div><div class="printfooter"> Retrieved from "<a dir="ltr" href="https://en.ryte.com/wiki/index.php?title=Information_Retrieval&amp;oldid=3021">https://en.ryte.com/wiki/index.php?title=Information_Retrieval&amp;oldid=3021</a>"</div> <div class="visualClear"></div></div><div class="ryte-content-category-list"><h2 class="mw-headline">Category</h2><ul><li><a href="/wiki/Category:Search_Engine_Optimization" title="Category:Search Engine Optimization" data-bs-title="Category:Search_Engine_Optimization">Search Engine Optimization</a></li></ul></div></div><div id='mw-data-after-content'> <div class="read-more-container"></div> </div> </div></div></div><footer class="imprint_lnks center"><a href="/about/tou/">Terms of use</a> | <a href="/about/privacy/">Privacy</a> | <a href="/about/tos/">Terms and conditions</a> | <a href="/about/imprint/">Imprint</a><br>Copyright © 2021 Ryte</footer> <script type="text/plain" data-usercentrics="Google Tag Manager">(function (w, d, s, l, i) { w[l] = w[l] || []; w[l].push({ 'gtm.start': new Date().getTime(), event: 'gtm.js' }); var f = d.getElementsByTagName(s)[0], j = d.createElement(s), dl = l != 'dataLayer' ? 
'&l=' + l : ''; j.async = true; j.src = '//www.googletagmanager.com/gtm.js?id=' + i + dl; f.parentNode.insertBefore(j, f); })(window, document, 'script', 'dataLayer', 'GTM-NP734B');</script> <script>(RLQ=window.RLQ||[]).push(function(){mw.config.set({"wgPageParseReport":{"limitreport":{"cputime":"0.003","walltime":"0.006","ppvisitednodes":{"value":26,"limit":1000000},"postexpandincludesize":{"value":0,"limit":2097152},"templateargumentsize":{"value":0,"limit":2097152},"expansiondepth":{"value":2,"limit":40},"expensivefunctioncount":{"value":0,"limit":100},"unstrip-depth":{"value":0,"limit":20},"unstrip-size":{"value":0,"limit":5000000},"timingprofile":["100.00% 0.000 1 -total"]},"cachereport":{"timestamp":"20250217122125","ttl":86400,"transientcontent":false}}});mw.config.set({"wgBackendResponseTime":291});});</script></body> </html>

Pages: 1 2 3 4 5 6 7 8 9 10