CINXE.COM
Technorati Weblog: Rolling out the new crawler
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd"> <html xmlns="http://www.w3.org/1999/xhtml"> <head profile="http://gmpg.org/xfn/11"><script type="text/javascript" src="/_static/js/bundle-playback.js?v=HxkREWBo" charset="utf-8"></script> <script type="text/javascript" src="/_static/js/wombat.js?v=txqj7nKC" charset="utf-8"></script> <script>window.RufflePlayer=window.RufflePlayer||{};window.RufflePlayer.config={"autoplay":"on","unmuteOverlay":"hidden"};</script> <script type="text/javascript" src="/_static/js/ruffle/ruffle.js"></script> <script type="text/javascript"> __wm.init("http://web.archive.org/web"); __wm.wombat("http://technorati.com:80/weblog/2009/02/473.html","20090221150230","http://web.archive.org/","web","/_static/", "1235228550"); </script> <link rel="stylesheet" type="text/css" href="/_static/css/banner-styles.css?v=S1zqJCYt" /> <link rel="stylesheet" type="text/css" href="/_static/css/iconochive.css?v=3PDvdIFv" /> <!-- End Wayback Rewrite JS Include --> <meta http-equiv="Content-Type" content="text/html; charset=utf-8"/> <title>Technorati Weblog: Rolling out the new crawler</title> <link href="http://web.archive.org/web/20090221150230cs_/http://static.technorati.com/static/css/global.css" rel="stylesheet" type="text/css"/> <link href="http://web.archive.org/web/20090221150230cs_/http://static.technorati.com/static/css/technorati.css" rel="stylesheet" type="text/css"/> <link href="http://web.archive.org/web/20090221150230cs_/http://static.technorati.com/static/css/content.css" rel="stylesheet" type="text/css"/> <link href="http://web.archive.org/web/20090221150230cs_/http://static.technorati.com/static/css/section-weblog.css" rel="stylesheet" type="text/css"/> <script src="http://web.archive.org/web/20090221150230js_/http://static.technorati.com/static/js/base.js" type="text/javascript"></script> <script 
src="http://web.archive.org/web/20090221150230js_/http://static.technorati.com/static/js/global.js" type="text/javascript"></script> <link rel="alternate" hreflang="ja" href="http://web.archive.org/web/20090221150230/http://www.technorati.jp/" title="Technorati Japan"/> <link rel="search" type="application/opensearchdescription+xml" href="http://web.archive.org/web/20090221150230/http://technorati.com/osd.xml" title="Technorati Search"/> <link rel="copyright" href="#copyright"/> </head> <body id="technorati"> <div class="tracking"> <!-- Begin pageImpression --> <script type="text/javascript"> var zzt=new Image(); zzt.src="http://web.archive.org/web/20090221150230/http://static.technorati.com/z/5040473824.gif?anM9MSZyZWY9LSZ2aXNpdG9yaWQ9NjcuMjAyLjU0LjE5MS4xMjM1MjI4MzA4ODAwNDY5JnVzZXJpZD0tJnNlc3Npb25pZD0tJnVzZXJjbGFzcz0tJmFiY2xhc3M9LSZhYnN3aXRjaD0tJm1lbWJlcj0tJnNlc3Npb25zdGFydHRpbWU9MTIzNTIyODU0OSZzZXNzaW9uZHVyYXRpb249LSZ2aXNpdGNvdW50PTEmdmlzaXRzdGFydHRpbWU9MTIzNTIyODU0OSZ2aXNpdGR1cmF0aW9uPS0mdmlzaXRwYWdlY291bnQ9MSZuZXdiaWVmbGFnPTAmYXV0aG9yaXplZD0wJmJsb2djbGFpbXM9MA=="; </script> <noscript> <div><img width="1" height="1" alt="" src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/z/5040473824.gif?anM9MCZyZWY9LSZ2aXNpdG9yaWQ9NjcuMjAyLjU0LjE5MS4xMjM1MjI4MzA4ODAwNDY5JnVzZXJpZD0tJnNlc3Npb25pZD0tJnVzZXJjbGFzcz0tJmFiY2xhc3M9LSZhYnN3aXRjaD0tJm1lbWJlcj0tJnNlc3Npb25zdGFydHRpbWU9MTIzNTIyODU0OSZzZXNzaW9uZHVyYXRpb249LSZ2aXNpdGNvdW50PTEmdmlzaXRzdGFydHRpbWU9MTIzNTIyODU0OSZ2aXNpdGR1cmF0aW9uPS0mdmlzaXRwYWdlY291bnQ9MSZuZXdiaWVmbGFnPTAmYXV0aG9yaXplZD0wJmJsb2djbGFpbXM9MA=="/></div> </noscript> <!-- End pageImpression --> <!-- Start Quantcast --> <script type="text/javascript" src="http://web.archive.org/web/20090221150230js_/http://edge.quantserve.com/quant.js"></script> <script type="text/javascript"> _qoptions = { tags:"tri.weblog" }; _qacct="p-6cp0NSw2i2sSA";quantserve();</script> <noscript><div><a 
href="http://web.archive.org/web/20090221150230/http://www.quantcast.com/p-6cp0NSw2i2sSA"><img src="http://web.archive.org/web/20090221150230im_/http://pixel.quantserve.com/pixel/p-6cp0NSw2i2sSA.gif?tags=tri.weblog" height="1" width="1" alt=""/></a></div></noscript> <!-- End Quantcast --> <script type="text/javascript"> var gaJsHost = (("https:" == document.location.protocol) ? "http://web.archive.org/web/20090221150230/https://ssl." : "http://web.archive.org/web/20090221150230/http://www."); document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E")); </script> <script type="text/javascript"> var pageTracker = _gat._getTracker("UA-4781905-1"); pageTracker._initData(); </script> </div> <div id="container"> <div id="banner-ad" class="ad"> <div class="doubleclick"> <!-- Begin DoubleClick Ad --> <script type="text/javascript"> <!-- document.write('<script type="text/javascript" src="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/adj/tri.weblog;tile=1;pos=top;ad=rb;member=0;sz=728x90;ord=8567286017350852?" 
type="text/javascript"></scr' + 'ipt>'); //--> </script> <noscript><div><a href="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/jump/tri.weblog;tile=1;pos=top;ad=rb;member=0;sz=728x90;ord=8567286017350852"><img src="http://web.archive.org/web/20090221150230im_/http://ad.doubleclick.net/ad/tri.weblog;tile=1;pos=top;ad=rb;member=0;sz=728x90;ord=8567286017350852" width="728" height="90" alt=""/></a></div></noscript> <!-- End DoubleClick Ad --> </div> </div> <div id="header-channels"> <span>Explore Technorati:</span> <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Technology');" href="/web/20090221150230/http://technorati.com/technology/">Technology</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Business');" href="/web/20090221150230/http://technorati.com/business/">Business</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Entertainment');" href="/web/20090221150230/http://technorati.com/entertainment/">Entertainment</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Lifestyle');" href="/web/20090221150230/http://technorati.com/lifestyle/">Lifestyle</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Politics');" href="/web/20090221150230/http://technorati.com/politics/">Politics</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Sports');" href="/web/20090221150230/http://technorati.com/sports/">Sports</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Gadgets');" href="/web/20090221150230/http://technorati.com/technology/gadgets/">Gadgets</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Celebrity');" href="/web/20090221150230/http://technorati.com/entertainment/celebrity/">Celebrity</a> / <a rel="nofollow" 
onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - IT');" href="/web/20090221150230/http://technorati.com/technology/it/">IT</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Film');" href="/web/20090221150230/http://technorati.com/entertainment/film/">Film</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Music');" href="/web/20090221150230/http://technorati.com/entertainment/music/">Music</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Finance');" href="/web/20090221150230/http://technorati.com/business/finance/">Finance</a> / <a rel="nofollow" onclick="pageTracker._trackEvent('Header Channels', 'Click Explore - Advertising');" href="/web/20090221150230/http://technorati.com/business/advertising/">Advertising</a> </div> <div id="header"><div id="header-inner"> <a id="logo" href="/web/20090221150230/http://technorati.com/">Technorati</a> <form id="search" action="/web/20090221150230/http://technorati.com/query.php" method="post"> <div> <label for="q">search the blogosphere…</label> <input type="text" id="q" name="q" value=""/> <input class="submit" type="image" src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/static/images/global/search-submit.png" alt="Go"/> <a href="/web/20090221150230/http://technorati.com/search?advanced">advanced</a> </div> </form> <ul id="account"> <li><a id="join-link" href="/web/20090221150230/http://technorati.com/account/signup/?destination=/weblog/2009/02/473.html">Join</a></li> <li><a id="_please-pardon-this-crappy-hack_sign-in-link" href="/web/20090221150230/http://technorati.com/account/signup/?destination=/weblog/2009/02/473.html">Sign in</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/">Help</a></li> </ul> </div></div> <div id="nav" onclick="$(this).track('/nav');"><div id="nav-inner"> <ul> <li 
id="channels-menu" onclick="$(this).track('channels');" class="complex-menu featured"> <a href="" onclick="$(this).track('menu');">Channels</a> <ul class="dropdown"> <li class="dropdown-promo"> <a href="/web/20090221150230/http://technorati.com/lifestyle/travel/" onclick="$(this).track('/promo/editorial/nav-channel/20090219');">Travel: people still on the go despite economy and accidents.</a> </li> <li class="complex-li first-block"> <h3><a href="/web/20090221150230/http://technorati.com/business/" onclick="$(this).track('business');">Business</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/business/advertising/" onclick="$(this).track('advertising');">Advertising</a></li> <li><a href="/web/20090221150230/http://technorati.com/business/finance/" onclick="$(this).track('finance');">Finance</a></li> <li><a href="/web/20090221150230/http://technorati.com/business/small-business/" onclick="$(this).track('smallbusiness');">Small Business</a></li> </ul> </li> <li class="complex-li second-block"> <h3><a href="/web/20090221150230/http://technorati.com/entertainment/" onclick="$(this).track('entertainment');">Entertainment</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/entertainment/celebrity/" onclick="$(this).track('celebrity');">Celebrity</a></li> <li><a href="/web/20090221150230/http://technorati.com/entertainment/film/" onclick="$(this).track('film');">Film</a></li> <li><a href="/web/20090221150230/http://technorati.com/entertainment/gaming/" onclick="$(this).track('gaming');">Gaming</a></li> <li><a href="/web/20090221150230/http://technorati.com/entertainment/indie-film/" onclick="$(this).track('indiefilm');">Indie Film</a></li> <li><a href="/web/20090221150230/http://technorati.com/entertainment/music/" onclick="$(this).track('music');">Music</a></li> <li><a href="/web/20090221150230/http://technorati.com/entertainment/tv/" onclick="$(this).track('tv');">TV</a></li> </ul> </li> <li class="complex-li third-block"> <h3><a 
href="/web/20090221150230/http://technorati.com/lifestyle/" onclick="$(this).track('lifestyle');">Lifestyle</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/lifestyle/autos/" onclick="$(this).track('autos');">Autos</a></li> <li><a href="/web/20090221150230/http://technorati.com/lifestyle/family/" onclick="$(this).track('family');">Family</a></li> <li><a href="/web/20090221150230/http://technorati.com/lifestyle/green/" onclick="$(this).track('green');">Green</a></li> <li><a href="/web/20090221150230/http://technorati.com/lifestyle/travel/" onclick="$(this).track('travel');">Travel</a></li> </ul> </li> <li class="complex-li fourth-block"> <h3><a href="/web/20090221150230/http://technorati.com/politics/" onclick="$(this).track('politics');">Politics</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/politics/election-2008/" onclick="$(this).track('election2008');">Election 2008</a></li> </ul> </li> <li class="complex-li fifth-block"> <h3><a href="/web/20090221150230/http://technorati.com/sports/" onclick="$(this).track('sports');">Sports</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/sports/baseball/" onclick="$(this).track('baseball');">Baseball</a></li> <li><a href="/web/20090221150230/http://technorati.com/sports/football/" onclick="$(this).track('football');">Football</a></li> <li><a href="/web/20090221150230/http://technorati.com/sports/green/" onclick="$(this).track('olympics');">Olympics</a></li> </ul> </li> <li class="complex-li sixth-block"> <h3><a href="/web/20090221150230/http://technorati.com/technology/" onclick="$(this).track('technology');">Technology</a></h3> <ul> <li><a href="/web/20090221150230/http://technorati.com/technology/gadgets/" onclick="$(this).track('gadgets');">Gadgets</a></li> <li><a href="/web/20090221150230/http://technorati.com/technology/it/" onclick="$(this).track('it');">IT</a></li> </ul> </li> </ul> </li> <li id="blogs-menu" onclick="$(this).track('blogs');" class=" "> <a 
href="/web/20090221150230/http://technorati.com/blogs/directory/" onclick="$(this).track('menu');">Blogs</a> <ul class="dropdown"> <li> <h3><a href="/web/20090221150230/http://technorati.com/blogs/directory/" onclick="$(this).track('blogdirectory');">Blog Directory</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/blogs/" onclick="$(this).track('top100blogs');">Top 100 Blogs</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/weblog/" onclick="$(this).track('technoratiblog');">Technorati Blog</a></h3> </li> </ul> </li> <li id="photos-menu" class="no-subitems"><a href="/web/20090221150230/http://technorati.com/photos/" onclick="$(this).track('photos');">Photos</a></li> <li id="videos-menu" class="no-subitems"><a href="/web/20090221150230/http://technorati.com/videos/" onclick="$(this).track('videos');">Videos</a></li> <li id="favorites-menu" onclick="$(this).track('favorites');" class=" "> <a href="/web/20090221150230/http://technorati.com/faves/" onclick="$(this).track('menu');">Favorites</a> <ul class="dropdown"> <li> <h3><a href="/web/20090221150230/http://technorati.com/faves/" onclick="$(this).track('favorites');">Favorites</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/watchlist/" onclick="$(this).track('watchlists');">Watchlists</a></h3> </li> </ul> </li> <li id="popular-menu" onclick="$(this).track('popular');" class=" "> <a href="/web/20090221150230/http://technorati.com/pop/" onclick="$(this).track('menu');">Popular</a> <ul class="dropdown"> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/" onclick="$(this).track('whatspopular');">What's Popular</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/tag/" onclick="$(this).track('populartags');">Popular Tags</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/youtube/" onclick="$(this).track('popularvideos');">Popular Videos</a></h3> </li> <li> <h3><a 
href="/web/20090221150230/http://technorati.com/pop/movies/" onclick="$(this).track('popularmovies');">Popular Movies</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/news/" onclick="$(this).track('popularnews');">Popular News</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/music/" onclick="$(this).track('popularmusic');">Popular Music</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/games/" onclick="$(this).track('populargames');">Popular Games</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/dvds/" onclick="$(this).track('populardvds');">Popular DVDs</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/pop/books/" onclick="$(this).track('popularbooks');">Popular Books</a></h3> </li> </ul> </li> <li id="bloggercentral-menu" onclick="$(this).track('bloggercentral');" class=" "> <a href="/web/20090221150230/http://technorati.com/blogging/" onclick="$(this).track('menu');">Blogger Central</a> <ul class="dropdown"> <li> <h3><a href="/web/20090221150230/http://technorati.com/blogging/" onclick="$(this).track('bloggercentral');">Blogger Central</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/blogging/state-of-the-blogosphere/" onclick="$(this).track('sob');">State of the Blogosphere</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/ping/" onclick="$(this).track('ping');">Ping Your Blog</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/account/claims/" onclick="$(this).track('claimyourblog');">Claim Your Blog</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/widgets/" onclick="$(this).track('widgets');">Widgets</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/chart/" onclick="$(this).track('chart');">Charts</a></h3> </li> <li> <h3><a href="/web/20090221150230/http://technorati.com/developers/" 
onclick="$(this).track('developers');">Developers</a></h3> </li> </ul> </li> <li id="support-menu" onclick="$(this).track('support');" class=" "> <a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/" onclick="$(this).track('menu');">Support</a> <ul class="dropdown"> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/" onclick="$(this).track('support-home');">Support Home</a></h3> </li> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/blog/" onclick="$(this).track('sitestatus');">Site Status</a></h3> </li> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/guidelines/" onclick="$(this).track('blogquality');">Blog Quality</a></h3> </li> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/" onclick="$(this).track('topfaqs');">Top FAQs</a></h3> <li> <ul class=""> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/topic/87" onclick="$(this).track('what');">What does Claiming my blog do?</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/topic/34" onclick="$(this).track('how');">How do I get indexed?</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/topic/47" onclick="$(this).track('whattag');">What is a Tag?</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/topic/71" onclick="$(this).track('whatauthority');">What is Authority?</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/faq/topic/60" onclick="$(this).track('howspam');">How do I report Spam?</a></li> </ul> </li> </li> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/" onclick="$(this).track('siteguide');">Site Guide</a></h3> <li> <ul class=""> <li><a 
href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/" onclick="$(this).track('bloggingbasics');">Blogging Basics</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/search/" onclick="$(this).track('sg-search');">Search</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/tags/" onclick="$(this).track('sg-tags');">Tags</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/directory/" onclick="$(this).track('sg-blogs');">Blogs</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/photos/" onclick="$(this).track('sg-photos');">Photos</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/videos/" onclick="$(this).track('sg-videos');">Videos</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/faves/" onclick="$(this).track('sg-favorites');">Favorites</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/support/siteguide/channels/" onclick="$(this).track('sg-channels');">Channels</a></li> </ul> </li> </li> <li> <h3><a href="http://web.archive.org/web/20090221150230/http://support.technorati.com/discussions/" onclick="$(this).track('supportforum');">Support Forum</a></h3> </li> </ul> </li> <li id="navigation-promo" class="no-subitems"><a onclick="$(this).track('/promo/editorial/nav/20090219');" href="/web/20090221150230/http://technorati.com/pop/music/">Music: New Springsteen talk of Blogosphere</a></li> </ul> </div></div> <script>initNavigation();</script> <div id="content"><div id="content-inner"> <div id="main" class="content"> <div id="technoblog"> <div class="entry"> <div class="entry_info"> <div class="inner"> <h3>Rolling out the new 
crawler</h3> <img class="photo" src="/web/20090221150230im_/http://technorati.com/static/img/staff/dorion_carroll.jpg" alt="Dorion Carroll"/><h4 class="byline">Posted by <cite class="vcard"><a href="http://web.archive.org/web/20090221150230/http://technorati.com/about/staff.html?s=dorion_carroll" class="fn">Dorion Carroll</a></cite> on February 7, 2009</h4> <p> <span class="tags">Category: <a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/blogging" rel="tag" title="Technorati Weblog posts about: Blogging">Blogging</a></span> <span class="permalink"><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/02/473.html">Permalink</a> · <script src="http://web.archive.org/web/20090221150230js_/http://embed.technorati.com/linkcount" type="text/javascript"></script> <a href="http://web.archive.org/web/20090221150230/http://technorati.com/search/http%3A%2F%2Ftechnorati.com%2Fweblog%2F2009%2F02%2F473.html?sub=nscosmos" rel="linkcount">View blog reactions</a> </span> </p> </div> </div> <div class="entry_body"> <p>Over the last six months we've been working on a rewrite of our blog crawling infrastructure from the ground up. Sometimes it seems like blogs are like fingerprints, no two are alike. With a new architectural approach, we've added a lot better coverage of many new blogging conventions, better visibility and tracking of what is happening in the internals of the crawler, and how to do a better job of recognizing all the great content bloggers are discussing and linking to.</p> <p>The time has come to retire the original Technorati crawler. Most blogs from the larger platforms have been using the new crawler for a few months and we're now ready to convert the rest of the blogs in our index.</p> <p>We've been moving large portions of blogs during the past two weeks and still have a lot to go. The large scale shift has put some strain on our crawl queues and data management systems during this wave of updates. 
The big push has resulted in slower times to index than usual. We're working hard to keep the new posts coming in and expect the majority of the backlog to be sorted out during this next week. We appreciate your patience. I think you'll like the results when everything is converted.</p> <p>Keep on blogging. The Crawler Development Team.</p> </div> </div> <div id="pages" class="box"> <a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/02/472.html" title="Previous post">« We’re Launching Original Tag Articles and Blurbs on Technorati.com</a> <b class="cn tl"></b> <b class="cn tr"></b> <b class="cn br"></b> <b class="cn bl"></b> </div> </div> </div> <div id="extra"> <div class="sponsor"> <div class="doubleclick"> <!-- Begin DoubleClick Ad --> <script type="text/javascript"> <!-- document.write('<script type="text/javascript" src="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/adj/tri.bloggercentral/weblog;ad=rb;member=0;sz=300x60;ord=8567286017350852?" type="text/javascript"></scr' + 'ipt>'); //--> </script> <noscript><div><a href="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/jump/tri.bloggercentral/weblog;ad=rb;member=0;sz=300x60;ord=8567286017350852"><img src="http://web.archive.org/web/20090221150230im_/http://ad.doubleclick.net/ad/tri.bloggercentral/weblog;ad=rb;member=0;sz=300x60;ord=8567286017350852" width="300" height="60" alt=""/></a></div></noscript> <!-- End DoubleClick Ad --> </div> </div> <div class="ad module"> <div class="doubleclick"> <!-- Begin DoubleClick Ad --> <script type="text/javascript"> <!-- document.write('<script type="text/javascript" src="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/adj/tri.bloggercentral/weblog;tile=2;pos=top;ad=rb;member=0;sz=300x250;ord=8567286017350852?" 
type="text/javascript"></scr' + 'ipt>'); //--> </script> <noscript><div><a href="http://web.archive.org/web/20090221150230/http://ad.doubleclick.net/jump/tri.bloggercentral/weblog;tile=2;pos=top;ad=rb;member=0;sz=300x250;ord=8567286017350852"><img src="http://web.archive.org/web/20090221150230im_/http://ad.doubleclick.net/ad/tri.bloggercentral/weblog;tile=2;pos=top;ad=rb;member=0;sz=300x250;ord=8567286017350852" width="300" height="250" alt=""/></a></div></noscript> <!-- End DoubleClick Ad --> </div> </div> <div id="blogarchives"> <div id="weblog_searches"> <div class="inner"> <div id="technorati_search"> <form action="/web/20090221150230/http://technorati.com/search.php" class="search" method="post"> <input type="text" id="bsearch" name="s" value="" class="label" onblur="if(this.value ==''){this.className='label';this.value='Search this blog';}" onfocus="if(this.value=='Search this blog'){this.className='';this.value='';}"/> <script type="text/javascript"> $e('bsearch').value = "Search this blog"; </script> <input type="submit" class="btn" value="Search"/> <input type="hidden" name="from" value="http://technorati.com/weblog/"/> </form> </div> <h2>View Archived Posts</h2> <form id="archivemonth" action="#"> <p> <label for="montharchive">by month</label> <select name="select1" id="montharchive" onchange="surfto(this.form)"> <option selected="selected" value="/">Select Month</option> <option value="http://technorati.com/weblog/2009/02/">February 2009</option> <option value="http://technorati.com/weblog/2009/01/">January 2009</option> <option value="http://technorati.com/weblog/2008/12/">December 2008</option> <option value="http://technorati.com/weblog/2008/11/">November 2008</option> <option value="http://technorati.com/weblog/2008/10/">October 2008</option> <option value="http://technorati.com/weblog/2008/09/">September 2008</option> <option value="http://technorati.com/weblog/2008/08/">August 2008</option> <option value="http://technorati.com/weblog/2008/06/">June 
2008</option> <option value="http://technorati.com/weblog/2008/05/">May 2008</option> <option value="http://technorati.com/weblog/2008/04/">April 2008</option> <option value="http://technorati.com/weblog/2008/02/">February 2008</option> <option value="http://technorati.com/weblog/2008/01/">January 2008</option> <option value="http://technorati.com/weblog/2007/12/">December 2007</option> <option value="http://technorati.com/weblog/2007/11/">November 2007</option> <option value="http://technorati.com/weblog/2007/10/">October 2007</option> <option value="http://technorati.com/weblog/2007/09/">September 2007</option> <option value="http://technorati.com/weblog/2007/08/">August 2007</option> <option value="http://technorati.com/weblog/2007/07/">July 2007</option> <option value="http://technorati.com/weblog/2007/06/">June 2007</option> <option value="http://technorati.com/weblog/2007/05/">May 2007</option> <option value="http://technorati.com/weblog/2007/04/">April 2007</option> <option value="http://technorati.com/weblog/2007/03/">March 2007</option> <option value="http://technorati.com/weblog/2007/02/">February 2007</option> <option value="http://technorati.com/weblog/2007/01/">January 2007</option> <option value="http://technorati.com/weblog/2006/12/">December 2006</option> <option value="http://technorati.com/weblog/2006/11/">November 2006</option> <option value="http://technorati.com/weblog/2006/10/">October 2006</option> <option value="http://technorati.com/weblog/2006/09/">September 2006</option> <option value="http://technorati.com/weblog/2006/08/">August 2006</option> <option value="http://technorati.com/weblog/2006/07/">July 2006</option> <option value="http://technorati.com/weblog/2006/05/">May 2006</option> <option value="http://technorati.com/weblog/2006/04/">April 2006</option> <option value="http://technorati.com/weblog/2006/02/">February 2006</option> <option value="http://technorati.com/weblog/2006/01/">January 2006</option> <option 
value="http://technorati.com/weblog/2005/12/">December 2005</option> <option value="http://technorati.com/weblog/2005/11/">November 2005</option> <option value="http://technorati.com/weblog/2005/10/">October 2005</option> <option value="http://technorati.com/weblog/2005/09/">September 2005</option> <option value="http://technorati.com/weblog/2005/08/">August 2005</option> <option value="http://technorati.com/weblog/2005/07/">July 2005</option> <option value="http://technorati.com/weblog/2005/06/">June 2005</option> <option value="http://technorati.com/weblog/2005/05/">May 2005</option> </select> </p> </form> <form id="archivetags" action="#"> <p> <label for="tagarchive">by category</label> <select id="tagarchive" name="select1" onchange="surfto(this.form)"> <option selected="selected" value="/">Select Category</option> <option value="http://technorati.com/weblog/blogging/">Blogging</option> <option value="http://technorati.com/weblog/blogosphere/">Blogosphere</option> <option value="http://technorati.com/weblog/contests/">Contests</option> <option value="http://technorati.com/weblog/events/">Events</option> <option value="http://technorati.com/weblog/favorites/">Favorites</option> <option value="http://technorati.com/weblog/pop_culture/">Pop Culture</option> <option value="http://technorati.com/weblog/technorati_news/">Technorati News</option> <option value="http://technorati.com/weblog/world_news/">World News</option> <option value="http://technorati.com/weblog/widgets/">widgets</option> </select> </p> </form> </div> </div> <div id="recent_titles"> <h2>Recent posts</h2> <ol> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/02/473.html">Rolling out the new crawler</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/02/472.html">We’re Launching Original Tag Articles and Blurbs on Technorati.com</a></li> <li><a 
href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/02/471.html">Trust</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/01/469.html">We’ve Got Web 2.0 Passes to Give Away</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/01/466.html">Welcome To The Blogosphere, Mr. President</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/01/465.html">Liveblog the Inauguration with BlogCritics</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/01/464.html">Technorati.com Network Test - January 16, 2009</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2009/01/463.html">If You're in Chicago, a Social Media Conference Well Worth Attending</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2008/12/460.html">Scheduled Maintenance, Monday, December 22, 2008</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technorati.com/weblog/2008/12/457.html">Some Upgrades to Technorati.com</a></li> </ol> </div><!-- <form id="searchall" method="get" action="http://technorati.com/cosmos/search.html"> <p> <label for="wlsearchall">Search all blogs:</label> <input type="hidden" name="sub" value="searchlet" /> <input id="wlsearchall" size="15" type="text" name="url" maxlength="255" value="" /> <input type="submit" value="Search" style="font-size: 10px; font-weight: bold;" /> </p> </form> --> </div> <div class="ad module technorati-engage"><!--- SCRIPT ID: 47260 --> <script> var zoneIdentifier = 'B99B951A9928BB0F'; var varCheckURL = (("https:" == document.location.protocol) ? 
"https://" : "http://"); document.write(unescape("%3Cscript src='" + varCheckURL + "adcode.technoratimedia.com/bootstrap/tti.js' type='text/javascript'%3E%3C/script%3E")); </script> </div> </div> <div style="clear: both;"></div> <div id="content-bottom-corners"></div> </div></div> </div> <div id="footer" class="wide-rounded"><div class="wide-rounded-inner" onclick="$(this).track('/footer');"> <div class="promo"> <ul> <li class="promo-item"> <h2 class="channel"><a href="/web/20090221150230/http://technorati.com/tag/" onclick="$(this).track('/promo/editorial/footer-left/20090219');">Tag Pages</a> »</h2> <div><a href="/web/20090221150230/http://technorati.com/tag/oscars" style="float: left; margin: 0 5px 20px 0; border: none;" onclick="$(this).track('/promo/editorial/footer-left/20090219');"><img style="display:block" src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/static/images/promos/20090219/kate-winslet-46x46.png" width="46" height="46" alt="Kate Winslet"/></a></div> <p><a href="/web/20090221150230/http://technorati.com/tag/oscars" onclick="$(this).track('/promo/editorial/footer-left/20090219');" rel="nofollow">Oscars</a>: will Slumdog Milk awards, or will Button remove all Doubt?</p> </li> <li class="promo-item second-promo"> <h2 class="channel"><a href="/web/20090221150230/http://technorati.com/blogs/directory/" onclick="$(this).track('/promo/editorial/footer-left-middle/20090219');">Blogs</a> »</h2> <div><a href="/web/20090221150230/http://technorati.com/blogs/www.talkingpointsmemo.com" style="float: left; margin: 0 5px 20px 0; border: none;" onclick="$(this).track('/promo/editorial/footer-left-middle/20090219');"><img style="display:block" src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/static/images/promos/20090219/josh-marshall-46x46.png" width="46" height="46" alt="Josh Marshall"/></a></div> <p>Washington from the left: <a 
href="/web/20090221150230/http://technorati.com/blogs/www.talkingpointsmemo.com" onclick="$(this).track('/promo/editorial/footer-left-middle/20090219');" rel="nofollow">Talking Points Memo</a>.</p> </li> <li> <div class="channel"><h2><a href="/web/20090221150230/http://technorati.com/photos/" onclick="$(this).track('/promo/footer-photos/text-link');">Today in Photos</a> »</h2></div> <a id="photos-anchor" href="/web/20090221150230/http://technorati.com/photos/" onclick="$(this).track('/promo/footer-photos/image-link');"><img src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/asset/img/collage_212x92.jpg" width="212" height="92" alt="Photos from popular blog posts"/></a> </li> <li class="partner"> <h2 class="channel">Technorati Media Partner »</h2> <p>Visit these great blogs in our network:</p> <ul> <li><h3><a class="external" href="http://web.archive.org/web/20090221150230/http://icanhascheezburger.com/" onclick="$(this).track('/promo/footer-media-partner/first-link');">I Can Has Cheezburger?</a></h3></li> <li><h3><a class="external" href="http://web.archive.org/web/20090221150230/http://tcritic.com/" onclick="$(this).track('/promo/footer-media-partner/second-link');">Tcritic</a></h3></li> <li><h3><a class="external" href="http://web.archive.org/web/20090221150230/http://nerdapproved.com/" onclick="$(this).track('/promo/footer-media-partner/third-link');">NerdApproved</a></h3></li> </ul> <div class="logo"><a href="http://web.archive.org/web/20090221150230/http://technoratimedia.com/" onclick="$(this).track('technoratimedia-image');"><img src="http://web.archive.org/web/20090221150230im_/http://static.technorati.com/static/images/global/technoratimedia-logo.png" alt="Technorati Media"/></a></div> </li> </ul> </div> <div style="clear: both;"></div> </div></div> <div id="footer-links" onclick="$(this).track('/global-footer');"> <ul> <li>© Technorati, Inc.</li> <li><a href="http://web.archive.org/web/20090221150230/http://www.technorati.jp/" 
onclick="$(this).track('technorati-japan');">Technorati Japan</a></li> <li><a href="/web/20090221150230/http://technorati.com/ping/" onclick="$(this).track('ping');">Ping Us</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://creativecommons.org/licenses/by-nc/3.0/" rel="license" title="Creative Commons Attribution-NonCommercial License" onclick="$(this).track('creative-commons-license');">CC License</a></li> <li><a href="/web/20090221150230/http://technorati.com/about/tos.html" onclick="$(this).track('terms-of-service');">Terms of Service</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technoratimedia.com/" onclick="$(this).track('about-us');">About Us</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technoratimedia.com/contact/" onclick="$(this).track('contact-us');">Contact Us</a></li> <li><a href="http://web.archive.org/web/20090221150230/http://technoratimedia.com/advertisers/" onclick="$(this).track('advertise');">Advertise</a></li> </ul> </div> <!-- elapsed render: 0.005 10.11.16.144 --> <script type="text/javascript"> pageTracker._trackPageview(); </script> <script type="text/javascript" src="http://web.archive.org/web/20090221150230js_/http://js.revsci.net/gateway/gw.js?csid=A09797"></script> <script type="text/javascript"> <!-- DM_tag(); //--></script> </body> </html> <!-- FILE ARCHIVED ON 15:02:30 Feb 21, 2009 AND RETRIEVED FROM THE INTERNET ARCHIVE ON 16:46:28 Nov 25, 2024. JAVASCRIPT APPENDED BY WAYBACK MACHINE, COPYRIGHT INTERNET ARCHIVE. ALL OTHER CONTENT MAY ALSO BE PROTECTED BY COPYRIGHT (17 U.S.C. SECTION 108(a)(3)). --> <!-- playback timings (ms): captures_list: 0.591 exclusion.robots: 0.029 exclusion.robots.policy: 0.017 esindex: 0.01 cdx.remote: 7.814 LoadShardBlock: 66.941 (3) PetaboxLoader3.datanode: 74.736 (4) load_resource: 160.379 PetaboxLoader3.resolve: 129.177 -->