findory.com - information about domain
- Server Status: available
- Server IP: 64.94.136.5
- Server Response Time: 402ms
Site title
Geeking with Greg: A brief history of Findory
Alexa information
Alexa rank: 12,967,184
Rank Trend
Bounce Trend
DNS Information
| Host: | Class: | Type: | IP: | TTL: | Target: | Other: |
| findory.com | IN | A | 64.94.136.5 | 3600 | | |
| findory.com | IN | SOA | | 3600 | | mname: dns1.nettica.com rname: hostmaster.nettica.com serial: 2005011916 refresh: 7200 retry: 1800 expire: 604800 minimum-ttl: 3600 |
| findory.com | IN | MX | | 3600 | aspmx.l.google.com | pri: 5 |
| findory.com | IN | MX | | 3600 | alt1.aspmx.l.google.com | pri: 10 |
| findory.com | IN | MX | | 3600 | alt2.aspmx.l.google.com | pri: 10 |
| findory.com | IN | MX | | 3600 | aspmx2.googlemail.com | pri: 20 |
| findory.com | IN | MX | | 3600 | aspmx3.googlemail.com | pri: 20 |
| findory.com | IN | MX | | 3600 | aspmx4.googlemail.com | pri: 20 |
| findory.com | IN | MX | | 3600 | aspmx5.googlemail.com | pri: 20 |
| findory.com | IN | NS | | 3600 | dns2.nettica.com | |
| findory.com | IN | NS | | 3600 | dns5.nettica.com | |
| findory.com | IN | NS | | 3600 | dns4.nettica.com | |
| findory.com | IN | NS | | 3600 | dns1.nettica.com | |
| findory.com | IN | NS | | 3600 | dns3.nettica.com | |
Server Location
Site source
Show / hide source
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
<html dir='ltr' xmlns='http://www.w3.org/1999/xhtml' xmlns:b='http://www.google.com/2005/gml/b' xmlns:data='http://www.google.com/2005/gml/data' xmlns:expr='http://www.google.com/2005/gml/expr'>
<head>
<meta content='text/html; charset=UTF-8' http-equiv='Content-Type'/>
<script type="text/javascript">(function() { var a=window;function c(b){this.t={};this.tick=function(b,i,d){d=void 0!=d?d:(new Date).getTime();this.t[b]=[d,i]};this.tick("start",null,b)}var f=new c;a.jstiming={Timer:c,load:f};try{var g=null;a.chrome&&a.chrome.csi&&(g=Math.floor(a.chrome.csi().pageT));null==g&&a.gtbExternal&&(g=a.gtbExternal.pageT());null==g&&a.external&&(g=a.external.pageT);g&&(a.jstiming.pt=g)}catch(h){};a.tickAboveFold=function(b){var e=0;if(b.offsetParent){do e+=b.offsetTop;while(b=b.offsetParent)}b=e;750>=b&&a.jstiming.load.tick("aft")};var j=!1;function k(){j||(j=!0,a.jstiming.load.tick("firstScrollTime"))}a.addEventListener?a.addEventListener("scroll",k,!1):a.attachEvent("onscroll",k);
})();</script>
<meta content='true' name='MSSmartTagsPreventParsing'/>
<meta content='blogger' name='generator'/>
<link href='http://glinden.blogspot.com/favicon.ico' rel='icon' type='image/x-icon'/>
<link href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html' rel='canonical'/>
<link rel="alternate" type="application/atom+xml" title="Geeking with Greg - Atom" href="http://glinden.blogspot.com/feeds/posts/default" />
<link rel="alternate" type="application/rss+xml" title="Geeking with Greg - RSS" href="http://glinden.blogspot.com/feeds/posts/default?alt=rss" />
<link rel="service.post" type="application/atom+xml" title="Geeking with Greg - Atom" href="http://www.blogger.com/feeds/6569681/posts/default" />
<link rel="EditURI" type="application/rsd+xml" title="RSD" href="http://www.blogger.com/rsd.g?blogID=6569681" />
<link rel="alternate" type="application/atom+xml" title="Geeking with Greg - Atom" href="http://glinden.blogspot.com/feeds/74972892038797195/comments/default" />
<link rel="image_src" href="http://4.bp.blogspot.com/_JQ7fxW3ASg4/R31D8GGgdQI/AAAAAAAACPw/y8eBhxfCQDE/s72-c/Findory-banner-logo.jpg" />
<!--[if IE]> <script> (function() { var html5 = ("abbr,article,aside,audio,canvas,datalist,details," + "figure,footer,header,hgroup,mark,menu,meter,nav,output," + "progress,section,time,video").split(','); for (var i = 0; i < html5.length; i++) { document.createElement(html5[i]); } try { document.execCommand('BackgroundImageCache', false, true); } catch(e) {} })(); </script> <![endif]-->
<title>Geeking with Greg: A brief history of Findory</title>
<link type='text/css' rel='stylesheet' href='http://www.blogger.com/static/v1/widgets/3432093398-widget_css_bundle.css' />
<link type="text/css" rel="stylesheet" href="http://www.blogger.com/dyn-css/authorization.css?targetBlogID=6569681&zx=3531bebc-6391-459a-a798-46c52f6505dd"/>
<style type="text/css">
#navbar-iframe { display:block }
</style>
<style id='page-skin-1' type='text/css'><!--
/*
-----------------------------------------------
Blogger Template Style
Name: Denim
Designer: Darren Delaye
URL: www.DarrenDelaye.com
Date: 11 Jul 2006
-----------------------------------------------
*/
/* Variable definitions
====================
<Variable name="bgColor" description="Page Background Color"
type="color" default="#efefef">
<Variable name="textColor" description="Text Color"
type="color" default="#333333">
<Variable name="linkColor" description="Link Color"
type="color" default="#336699">
<Variable name="headerBgColor" description="Page Header Background Color"
type="color" default="#336699">
<Variable name="headerTextColor" description="Page Header Text Color"
type="color" default="#ffffff">
<Variable name="headerCornersColor" description="Page Header Corners Color"
type="color" default="#528bc5">
<Variable name="mainBgColor" description="Main Background Color"
type="color" default="#ffffff">
<Variable name="borderColor" description="Border Color"
type="color" default="#cccccc">
<Variable name="dateHeaderColor" description="Date Header Color"
type="color" default="#999999">
<Variable name="sidebarTitleBgColor" description="Sidebar Title Background Color"
type="color" default="#ffd595">
<Variable name="sidebarTitleTextColor" description="Sidebar Title Text Color"
type="color" default="#333333">
<Variable name="bodyFont" description="Text Font"
type="font" default="normal normal 100% Verdana, Arial, Sans-serif;">
<Variable name="headerFont" description="Page Header Font"
type="font" default="normal normal 210% Verdana, Arial, Sans-serif;">
<Variable name="startSide" description="Start side in blog language"
type="automatic" default="left">
<Variable name="endSide" description="End side in blog language"
type="automatic" default="right">
*/
body {
background: #efefef;
margin: 0;
padding: 0px;
font: x-small Verdana, Arial;
text-align: center;
color: #333333;
font-size/* */:/**/small;
font-size: /**/small;
}
a:link {
color: #336699;
}
a:visited {
color: #336699;
}
a img {
border-width: 0;
}
#outer-wrapper {
font: normal normal 100% Verdana, Arial, Sans-serif;;
}
/* Header
----------------------------------------------- */
#header-wrapper {
margin:0;
padding: 0;
background-color: #304060;
text-align: left;
}
#header {
width: 760px;
margin: 0 auto;
background-color: #102040;
border: 1px solid #102040;
color: #eeeeee;
padding: 0;
font: normal normal 210% Verdana, Arial, Sans-serif;;
}
h1.title {
padding-top: 38px;
margin: 0 14px .1em;
line-height: 1.2em;
font-size: 100%;
}
h1.title a, h1.title a:visited {
color: #eeeeee;
text-decoration: none;
}
#header .description {
display: block;
margin: 0 14px;
padding: 0 0 40px;
line-height: 1.4em;
font-size: 50%;
}
/* Content
----------------------------------------------- */
.clear {
clear: both;
}
#content-wrapper {
width: 760px;
margin: 0 auto;
padding: 0 0 15px;
text-align: left;
background-color: #ffffff;
border: 1px solid #cccccc;
border-top: 0;
}
#main-wrapper {
margin-left: 14px;
width: 464px;
float: left;
background-color: #ffffff;
display: inline; /* fix for doubling margin in IE */
word-wrap: break-word; /* fix for long text breaking sidebar float in IE */
overflow: hidden; /* fix for long non-text content breaking IE sidebar float */
}
#sidebar-wrapper {
margin-right: 14px;
width: 240px;
float: right;
background-color: #ffffff;
display: inline; /* fix for doubling margin in IE */
word-wrap: break-word; /* fix for long text breaking sidebar float in IE */
overflow: hidden; /* fix for long non-text content breaking IE sidebar float */
}
/* Headings
----------------------------------------------- */
h2, h3 {
margin: 0;
}
/* Posts
----------------------------------------------- */
.date-header {
margin: 1.5em 0 0;
font-weight: normal;
color: #777777;
font-size: 100%;
}
.post {
margin: 0 0 1.5em;
padding-bottom: 1.5em;
}
.post-title {
margin: 0;
padding: 0;
font-size: 125%;
font-weight: bold;
line-height: 1.1em;
}
.post-title a, .post-title a:visited, .post-title strong {
text-decoration: none;
color: #333333;
font-weight: bold;
}
.post div {
margin: 0 0 .75em;
line-height: 1.3em;
}
.post-footer {
margin: -.25em 0 0;
color: #333333;
font-size: 87%;
}
.post-footer .span {
margin-right: .3em;
}
.post img, table.tr-caption-container {
padding: 4px;
border: 1px solid #cccccc;
}
.tr-caption-container img {
border: none;
padding: 0;
}
.post blockquote {
margin: 1em 20px;
}
.post blockquote p {
margin: .75em 0;
}
/* Comments
----------------------------------------------- */
#comments h4 {
margin: 1em 0;
color: #777777;
}
#comments h4 strong {
font-size: 110%;
}
#comments-block {
margin: 1em 0 1.5em;
line-height: 1.3em;
}
#comments-block dt {
margin: .5em 0;
}
#comments-block dd {
margin: .25em 0 0;
}
#comments-block dd.comment-footer {
margin: -.25em 0 2em;
line-height: 1.4em;
font-size: 78%;
}
#comments-block dd p {
margin: 0 0 .75em;
}
.deleted-comment {
font-style:italic;
color:gray;
}
.feed-links {
clear: both;
line-height: 2.5em;
}
#blog-pager-newer-link {
float: left;
}
#blog-pager-older-link {
float: right;
}
#blog-pager {
text-align: center;
}
/* Sidebar Content
----------------------------------------------- */
.sidebar h2 {
margin: 1.6em 0 .5em;
padding: 4px 5px;
background-color: #ffd595;
font-size: 100%;
color: #333333;
}
.sidebar ul {
margin: 0;
padding: 0;
list-style: none;
}
.sidebar li {
margin: 0;
padding-top: 0;
padding-right: 0;
padding-bottom: .5em;
padding-left: 15px;
text-indent: -15px;
line-height: 1.5em;
}
.sidebar {
color: #333333;
line-height:1.3em;
}
.sidebar .widget {
margin-bottom: 1em;
}
.sidebar .widget-content {
margin: 0 5px;
}
/* Profile
----------------------------------------------- */
.profile-img {
float: left;
margin-top: 0;
margin-right: 5px;
margin-bottom: 5px;
margin-left: 0;
padding: 4px;
border: 1px solid #cccccc;
}
.profile-data {
margin:0;
text-transform:uppercase;
letter-spacing:.1em;
font-weight: bold;
line-height: 1.6em;
font-size: 78%;
}
.profile-datablock {
margin:.5em 0 .5em;
}
.profile-textblock {
margin: 0.5em 0;
line-height: 1.6em;
}
/* Footer
----------------------------------------------- */
#footer {
clear: both;
text-align: center;
color: #333333;
}
#footer .widget {
margin:.5em;
padding-top: 20px;
font-size: 85%;
line-height: 1.5em;
text-align: left;
}
--></style>
<script type="text/javascript">(function(){if(-1!=navigator.userAgent.indexOf("Mobile")&&-1!=navigator.userAgent.indexOf("WebKit")&&-1==navigator.userAgent.indexOf("iPad")||-1!=navigator.userAgent.indexOf("Opera Mini")){var a;a:{var b=window.location.href,c=b.split("?");switch(c.length){case 1:a=b+"?m=1";break a;case 2:a=0<=c[1].search("(^|&)m=")?null:b+"&m=1";break a;default:a=null}}a&&window.location.replace(a)};})();
</script><script type="text/javascript">
if (window.jstiming) window.jstiming.load.tick('headEnd');
</script></head>
<body>
<div class='navbar section' id='navbar'><div class='widget Navbar' id='Navbar1'><script type="text/javascript">
// Defers the assignment object[attribute] = val until the window "load" event.
// Uses addEventListener when the window provides it, otherwise falls back to
// the legacy attachEvent registration.
function setAttributeOnload(object, attribute, val) {
  var applyValue = function () {
    object[attribute] = val;
  };

  if (!window.addEventListener) {
    window.attachEvent('onload', applyValue);
    return;
  }

  window.addEventListener("load", applyValue, false);
}
</script>
<iframe src="http://www.blogger.com/navbar.g?targetBlogID=6569681&blogName=Geeking+with+Greg&publishMode=PUBLISH_MODE_BLOGSPOT&navbarType=BLUE&layoutType=LAYOUTS&searchRoot=http://glinden.blogspot.com/search&blogLocale=en_US&homepageUrl=http://glinden.blogspot.com/&targetPostID=74972892038797195&vt=343804146203103123" marginwidth="0" marginheight="0" scrolling="no" frameborder="0" height="30px" width="100%" id="navbar-iframe" allowtransparency="true" title="Blogger Navigation and Search"></iframe>
<div></div><script type="text/javascript">
// Builds a script element pointing at google_top.js and appends it to the
// first head element of the document; does nothing if no head element exists.
(function () {
  var loader = document.createElement('script');
  loader.type = 'text/javascript';
  loader.src = '//pagead2.googlesyndication.com/pagead/js/google_top.js';

  var target = document.getElementsByTagName('head')[0];
  if (!target) {
    return;
  }
  target.appendChild(loader);
})();
</script>
</div></div>
<div id='outer-wrapper'><div id='wrap2'>
<!-- skip links for text browsers -->
<span id='skiplinks' style='display:none;'>
<a href='#main'>skip to main </a> |
<a href='#sidebar'>skip to sidebar</a>
</span>
<div id='header-wrapper'>
<div class='header section' id='header'><div class='widget Header' id='Header1'>
<div id='header-inner'>
<div class='titlewrapper'>
<h1 class='title'>
<a href='http://glinden.blogspot.com/'>Geeking with Greg</a>
</h1>
</div>
<div class='descriptionwrapper'>
<p class='description'><span>
</span></p>
</div>
</div>
</div></div>
</div>
<div id='content-wrapper'>
<div id='crosscol-wrapper' style='text-align:center'>
<div class='crosscol section' id='crosscol'></div>
</div>
<div id='main-wrapper'>
<div class='main section' id='main'><div class='widget Blog' id='Blog1'>
<div class='blog-posts hfeed'>
<!-- google_ad_section_start(name=default) -->
<div class="date-outer">
<h2 class='date-header'><span>Thursday, January 03, 2008</span></h2>
<div class="date-posts">
<div class='post-outer'>
<div class='post hentry'>
<a name='74972892038797195'></a>
<h3 class='post-title entry-title'>
A brief history of Findory
</h3>
<div class='post-header'>
<div class='post-header-line-1'></div>
</div>
<div class='post-body entry-content' id='post-body-74972892038797195'>
<img style="float:right; margin:0 0 10px 10px;" src="http://4.bp.blogspot.com/_JQ7fxW3ASg4/R31D8GGgdQI/AAAAAAAACPw/y8eBhxfCQDE/s320/Findory-banner-logo.jpg" border="0" alt="Findory logo" id="BLOGGER_PHOTO_ID_5151348248490833154" />Findory was a personalized news site. The site launched in January 2004 and shut down November 2007.<br /><br />A reader first coming to Findory would see a normal front page of news, the popular and important news stories of the day. When someone read articles on the site, Findory learned what stories interested that reader and changed the news that was featured to match that reader's interests. In this way, Findory built each reader a personalized front page of news.<br /><br />Below is a screenshot of an example personalized Findory home page. Articles marked with a sunburst icon are personalized, picked specifically for this reader based on this person's reading history.<br /><br /><a onblur="try {parent.deselectBloggerImageGracefully();} catch(e) {}" href="http://2.bp.blogspot.com/_JQ7fxW3ASg4/R31KHmGgdSI/AAAAAAAACQA/XCO8vTYWviY/s1600-h/Findory+home+page+cropped.jpg"><img style="display:block; margin:0px auto 10px; text-align:center;cursor:pointer; cursor:hand;" src="http://4.bp.blogspot.com/_JQ7fxW3ASg4/R31KCGGgdRI/AAAAAAAACP4/lNBK43tHeG8/s320/Findory+home+page+cropped+thumbnail.jpg" border="0" alt="Screenshot of a personalized Findory home page" id="BLOGGER_PHOTO_ID_5151347827584038114" /></a><center><small>[Clicking on the screenshot will bring up a full-sized version]</small></center><br />Findory's personalization used a type of hybrid collaborative filtering algorithm that recommended articles based on a combination of similarity of content and articles that tended to interest other Findory users with similar tastes.<br /><br />One way to think of this is that, when a person found and read an interesting article on Findory, that article would be shared with any other Findory readers who likely would be interested. 
Likewise, that person would benefit from interesting articles other Findory readers found. All this sharing of articles was done implicitly and anonymously without any effort from readers by Findory's recommendation engine.<br /><br />Findory's news recommendations were unusual in that they were primarily based on user behavior (what articles other readers had found), worked from very little data (starting after a single click on Findory), worked in real-time (changed immediately when someone read an article), required no set-up or configuration (worked just by watching articles read), and did not require readers to identify themselves (no login necessary).<br /><br />Findory's primary product was in news, but the broader goal of Findory was to personalize information. Toward that, Findory had alpha features that would recommend videos, podcasts, feeds, advertisements, and web search results.<br /><br />Video, podcast, and feed recommendations worked much like the news recommendations. The advertisement recommendations were an unusual form of fine-grained personalized advertising that attempted to target advertisements based not only on the content of the page, but also a person's reading history on Findory. The web search was an unusual form of fine-grained personalized web search that modified Google search results to feature items clicked on by searchers with similar search behavior (recommendations) or that were clicked on by this specific searcher in the past (re-finding).<br /><br />At its height, Findory was a popular website with over 100k unique visitors and 5M page views per month. 
Findory was well reviewed and received press coverage in the Wall Street Journal, Forbes, Time Magazine, PC World, The Times, Spiegel, Seattle PI, Seattle Times, Puget Sound Business Journal, KPLU, Slate, and elsewhere.<br /><br />More information and more details on Findory's history can be found in my <a href="http://www.google.com/search?q=allintitle%3Afindory+site%3Aglinden.blogspot.com">many previous posts</a> on Findory.
<div style='clear: both;'></div>
</div>
<div class='post-footer'>
<div class='post-footer-line post-footer-line-1'><span class='post-author vcard'>
Posted by
<span class='fn'>Greg Linden</span>
</span>
<span class='post-timestamp'>
at
<a class='timestamp-link' href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html' rel='bookmark' title='permanent link'><abbr class='published' title='2008-01-03T11:46:00-08:00'>11:46 AM</abbr></a>
</span>
<span class='post-comment-link'>
</span>
<span class='post-icons'>
</span>
<div class='post-share-buttons goog-inline-block'>
<a class='goog-inline-block share-button sb-email' href='http://www.blogger.com/share-post.g?blogID=6569681&postID=74972892038797195&target=email' target='_blank' title='Email This'><span class='share-button-link-text'>Email This</span></a><a class='goog-inline-block share-button sb-blog' href='http://www.blogger.com/share-post.g?blogID=6569681&postID=74972892038797195&target=blog' onclick='window.open(this.href, "_blank", "height=270,width=475"); return false;' target='_blank' title='BlogThis!'><span class='share-button-link-text'>BlogThis!</span></a><a class='goog-inline-block share-button sb-twitter' href='http://www.blogger.com/share-post.g?blogID=6569681&postID=74972892038797195&target=twitter' target='_blank' title='Share to Twitter'><span class='share-button-link-text'>Share to Twitter</span></a><a class='goog-inline-block share-button sb-facebook' href='http://www.blogger.com/share-post.g?blogID=6569681&postID=74972892038797195&target=facebook' onclick='window.open(this.href, "_blank", "height=430,width=640"); return false;' target='_blank' title='Share to Facebook'><span class='share-button-link-text'>Share to Facebook</span></a><div class='goog-inline-block dummy-container'><g:plusone source='blogger' href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html' size='medium' width='300' annotation='inline'/></div>
</div>
</div>
<div class='post-footer-line post-footer-line-2'></div>
<div class='post-footer-line post-footer-line-3'></div>
</div>
</div>
<div class='comments' id='comments'>
<a name='comments'></a>
<h4>
6
comments:
</h4>
<div id='Blog1_comments-block-wrapper'>
<dl class='avatar-comment-indent' id='comments-block'>
<dt class='comment-author ' id='c8825796390721378877'>
<a name='c8825796390721378877'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><a href="http://www.blogger.com/profile/10262558769855915929" rel="nofollow" onclick="" class="avatar-hovercard" id="av-0-10262558769855915929"><img src="http://img2.blogblog.com/img/b16-rounded.gif" width="16" height="16" alt="" title="Dean">
</a></span></div>
<a href='http://www.blogger.com/profile/10262558769855915929' rel='nofollow'>Dean</a>
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-8825796390721378877'>
<p>
Greg, how do you filter out multiple articles that are basically the same article that are generated from article submission software such as Artemis Pro? Just curious and thanks.
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1201150440000#c8825796390721378877' title='comment permalink'>
January 23, 2008 8:54 PM
</a>
<span class='item-control blog-admin pid-1176926213'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=8825796390721378877' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
<dt class='comment-author ' id='c2867220097152741625'>
<a name='c2867220097152741625'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><img src="http://img1.blogblog.com/img/blank.gif" width="16" height="16" alt="" title="Herve">
</span></div>
Herve
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-2867220097152741625'>
<p>
Why was your site stopped?
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1210412880000#c2867220097152741625' title='comment permalink'>
May 10, 2008 2:48 AM
</a>
<span class='item-control blog-admin pid-950740713'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=2867220097152741625' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
<dt class='comment-author ' id='c6775835844047792063'>
<a name='c6775835844047792063'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><img src="http://img1.blogblog.com/img/blank.gif" width="16" height="16" alt="" title="Anonymous">
</span></div>
Anonymous
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-6775835844047792063'>
<p>
To this day I miss findory. I never found an alternative.
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1234629240000#c6775835844047792063' title='comment permalink'>
February 14, 2009 8:34 AM
</a>
<span class='item-control blog-admin pid-694994277'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=6775835844047792063' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
<dt class='comment-author ' id='c3510271374741826146'>
<a name='c3510271374741826146'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><img src="http://img1.blogblog.com/img/blank.gif" width="16" height="16" alt="" title="Anonymous">
</span></div>
Anonymous
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-3510271374741826146'>
<p>
Nice to read about Findory, thanks
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1244417037696#c3510271374741826146' title='comment permalink'>
June 7, 2009 4:23 PM
</a>
<span class='item-control blog-admin pid-318982928'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=3510271374741826146' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
<dt class='comment-author ' id='c8856943973031912770'>
<a name='c8856943973031912770'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><img src="http://img1.blogblog.com/img/blank.gif" width="16" height="16" alt="" title="Anonymous">
</span></div>
Anonymous
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-8856943973031912770'>
<p>
filtering out multiple articles that are basically the same article can be done using MinHash
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1275466793288#c8856943973031912770' title='comment permalink'>
June 2, 2010 1:19 AM
</a>
<span class='item-control blog-admin pid-138385343'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=8856943973031912770' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
<dt class='comment-author blog-author' id='c2914768408503434277'>
<a name='c2914768408503434277'></a>
<div class="avatar-image-container avatar-stock"><span dir="ltr"><a href="http://www.blogger.com/profile/09216403000599463072" rel="nofollow" onclick="" class="avatar-hovercard" id="av-5-09216403000599463072"><img src="http://img2.blogblog.com/img/b16-rounded.gif" width="16" height="16" alt="" title="Greg Linden">
</a></span></div>
<a href='http://www.blogger.com/profile/09216403000599463072' rel='nofollow'>Greg Linden</a>
said...
</dt>
<dd class='comment-body' id='Blog1_cmt-2914768408503434277'>
<p>
In general, to filter out near dups, you need to define a similarity metric and then eliminate articles under some threshold of similarity.<br /><br />A common technique used for web search is to hash a bunch of signatures for sections of the page (usually after preprocessing to strip off the navigation elements of the page, advertising, etc.) and then consider the pages near duplicates if enough of the signatures match.<br /><br />There are a lot of papers on the topic if you want to dive in. See<br /><br /><a href="http://scholar.google.com/scholar?hl=en&q=near+duplicate+documents" rel="nofollow">http://scholar.google.com/scholar?hl=en&q=near+duplicate+documents</a>
</p>
</dd>
<dd class='comment-footer'>
<span class='comment-timestamp'>
<a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html?showComment=1275489522890#c2914768408503434277' title='comment permalink'>
June 2, 2010 7:38 AM
</a>
<span class='item-control blog-admin pid-1881361918'>
<a class='comment-delete' href='http://www.blogger.com/delete-comment.g?blogID=6569681&postID=2914768408503434277' title='Delete Comment'>
<img src='//www.blogger.com/img/icon_delete13.gif'/>
</a>
</span>
</span>
</dd>
</dl>
</div>
<p class='comment-footer'>
<a href='http://www.blogger.com/comment.g?blogID=6569681&postID=74972892038797195' onclick=''>Post a Comment</a>
</p>
<div id='backlinks-container'>
<div id='Blog1_backlinks-container'>
</div>
</div>
</div>
</div>
</div></div>
<!-- google_ad_section_end -->
</div>
<div class='blog-pager' id='blog-pager'>
<span id='blog-pager-newer-link'>
<a class='blog-pager-newer-link' href='http://glinden.blogspot.com/2008/01/coming-2008-dot-com-crash.html' id='Blog1_blog-pager-newer-link' title='Newer Post'>Newer Post</a>
</span>
<span id='blog-pager-older-link'>
<a class='blog-pager-older-link' href='http://glinden.blogspot.com/2008/01/upcoming-yahoo-talk-on-computational.html' id='Blog1_blog-pager-older-link' title='Older Post'>Older Post</a>
</span>
<a class='home-link' href='http://glinden.blogspot.com/'>Home</a>
</div>
<div class='clear'></div>
<div class='post-feeds'>
<div class='feed-links'>
Subscribe to:
<a class='feed-link' href='http://glinden.blogspot.com/feeds/74972892038797195/comments/default' target='_blank' type='application/atom+xml'>Post Comments (Atom)</a>
</div>
</div>
<script type="text/javascript">window.___gcfg = {'lang': 'en_US'};window.___gapisync = false;(function() {var po = document.createElement('script');po.type = 'text/javascript';po.async = true;po.src = 'https://apis.google.com/js/plusone.js';var s = document.body.getElementsByTagName('script')[0];s.parentNode.insertBefore(po, s);})();</script>
</div></div>
</div>
<div id='sidebar-wrapper'>
<div class='sidebar section' id='sidebar'><div class='widget HTML' id='HTML3'>
<h2 class='title'>About Me</h2>
<div class='widget-content'>
<a href="http://www.blogger.com/profile/09216403000599463072"><img alt="My Photo" width="65" src="https://sites.google.com/site/glinden/Home/glinden7.jpg" class="profile-img" height="80"/></a>
<dl class="profile-datablock">
<dt class="profile-data">Greg Linden</dt>
</dl>
<a class="profile-link" href="http://www.blogger.com/profile/09216403000599463072">View my complete profile</a>
</div>
<div class='clear'></div>
<span class='widget-item-control'>
<span class='item-control blog-admin'>
<a class='quickedit' href='http://www.blogger.com/rearrange?blogID=6569681&widgetType=HTML&widgetId=HTML3&action=editWidget&amp;sectionId=sidebar' onclick='return _WidgetManager._PopupConfig(document.getElementById("HTML3"));' target='configHTML3' title='Edit'>
<img alt='' height='18' src='http://img1.blogblog.com/img/icon18_wrench_allbkg.png' width='18'/>
</a>
</span>
</span>
<div class='clear'></div>
</div><div class='widget Text' id='Text1'>
<h2 class='title'>Subscribe to the Feed</h2>
<div class='widget-content'>
<a href="http://feeds.feedburner.com/GeekingWithGreg" rel="alternate" type="application/rss+xml"><img src="http://www.feedburner.com/fb/images/pub/feed-icon16x16.png" alt="" style="vertical-align:middle;border:0" /></a> <a href="http://feeds.feedburner.com/GeekingWithGreg" rel="alternate" type="application/rss+xml">Subscribe in a reader</a><br/><br/><span style="position: relative; left: 100px;"><a href="http://feeds.feedburner.com/GeekingWithGreg"><img src="http://feeds.feedburner.com/~fc/GeekingWithGreg?bg=99CCFF&fg=444444&anim=0" height="26" width="88" style="border:0" alt="" /></a></span>
</div>
<div class='clear'></div>
<span class='widget-item-control'>
<span class='item-control blog-admin'>
<a class='quickedit' href='http://www.blogger.com/rearrange?blogID=6569681&widgetType=Text&widgetId=Text1&action=editWidget&amp;sectionId=sidebar' onclick='return _WidgetManager._PopupConfig(document.getElementById("Text1"));' target='configText1' title='Edit'>
<img alt='' height='18' src='http://img1.blogblog.com/img/icon18_wrench_allbkg.png' width='18'/>
</a>
</span>
</span>
<div class='clear'></div>
</div><div class='widget TextList' id='TextList1'>
<h2>More Geeking with Me</h2>
<div class='widget-content'>
<ul>
<li><a href="http://twitter.com/greglinden" target="_new">Tweeting with Greg</a></li>
<li><a href="https://plus.google.com/102076128417589427747/posts" target="_new">Geeking on G+</a></li>
</ul>
<div class='clear'></div>
<span class='widget-item-control'>
<span class='item-control blog-admin'>
<a class='quickedit' href='http://www.blogger.com/rearrange?blogID=6569681&widgetType=TextList&widgetId=TextList1&action=editWidget&amp;sectionId=sidebar' onclick='return _WidgetManager._PopupConfig(document.getElementById("TextList1"));' target='configTextList1' title='Edit'>
<img alt='' height='18' src='http://img1.blogblog.com/img/icon18_wrench_allbkg.png' width='18'/>
</a>
</span>
</span>
<div class='clear'></div>
</div>
</div><div class='widget BlogArchive' id='BlogArchive1'>
<h2>Blog Archive</h2>
<div class='widget-content'>
<div id='ArchiveList'>
<div id='BlogArchive1_ArchiveList'>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2012-01-01T00:00:00-08:00&updated-max=2013-01-01T00:00:00-08:00&max-results=3'>2012</a>
<span class='post-count' dir='ltr'>(3)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2012_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2012/03/quick-links.html'>Quick links</a></li>
<li><a href='http://glinden.blogspot.com/2012/03/ad-targeting-at-yahoo.html'>Ad targeting at Yahoo</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2012_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2012/01/more-quick-links.html'>More quick links</a></li>
</ul>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2011-01-01T00:00:00-08:00&amp;updated-max=2012-01-01T00:00:00-08:00&amp;max-results=24'>2011</a>
<span class='post-count' dir='ltr'>(24)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/12/quick-links.html'>Quick links</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(3)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/11/browsing-behavior-for-web-crawling.html'>Browsing behavior for web crawling</a></li>
<li><a href='http://glinden.blogspot.com/2011/11/what-mobile-location-data-looks-like-to.html'>What mobile location data looks like to Google</a></li>
<li><a href='http://glinden.blogspot.com/2011/11/even-more-quick-links.html'>Even more quick links</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/10/more-quick-links.html'>More quick links</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/09/quick-links.html'>Quick links</a></li>
<li><a href='http://glinden.blogspot.com/2011/09/blending-machines-and-humans-to-get.html'>Blending machines and humans to get very high accu...</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/07/quick-links.html'>Quick links</a></li>
<li><a href='http://glinden.blogspot.com/2011/07/google-and-suggesting-friends.html'>Google and suggesting friends</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/06/quick-links.html'>Quick links</a></li>
<li><a href='http://glinden.blogspot.com/2011/06/continuous-profiling-at-google.html'>Continuous profiling at Google</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(4)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/05/eli-pariser-is-wrong.html'>Eli Pariser is wrong</a></li>
<li><a href='http://glinden.blogspot.com/2011/05/taking-small-steps-toward-personalized.html'>Taking small steps toward personalized search</a></li>
<li><a href='http://glinden.blogspot.com/2011/05/quick-links.html'>Quick links</a></li>
<li><a href='http://glinden.blogspot.com/2011/05/value-of-google-maps-directions-logs.html'>The value of Google Maps directions logs</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/04/resurgence-of-interest-in-personalized.html'>Resurgence of interest in personalized information...</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/03/latest-reading.html'>Latest reading</a></li>
<li><a href='http://glinden.blogspot.com/2011/03/personal-navigation-and-re-finding.html'>Personal navigation and re-finding</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(4)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/02/what-i-have-been-reading-lately.html'>What I have been reading lately</a></li>
<li><a href='http://glinden.blogspot.com/2011/02/comparing-google-megastore.html'>Comparing Google Megastore</a></li>
<li><a href='http://glinden.blogspot.com/2011/02/google-bing-and-web-browsing-data.html'>Google, Bing, and web browsing data</a></li>
<li><a href='http://glinden.blogspot.com/2011/02/youtube-uses-amazons-recommendation.html'>YouTube uses Amazon's recommendation algorithm</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2011_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2011/01/latest-reading.html'>Latest reading</a></li>
<li><a href='http://glinden.blogspot.com/2011/01/experiment-infrastructure-at-google.html'>The experiment infrastructure at Google</a></li>
</ul>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2010-01-01T00:00:00-08:00&amp;updated-max=2011-01-01T00:00:00-08:00&amp;max-results=40'>2010</a>
<span class='post-count' dir='ltr'>(40)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/12/papers-on-specialized-databases-at.html'>Papers on specialized databases at Google</a></li>
<li><a href='http://glinden.blogspot.com/2010/12/groupon-is-not-googly.html'>Groupon is not Googly</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(2)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/11/update-on-googles-infrastructure.html'>An update on Google's infrastructure</a></li>
<li><a href='http://glinden.blogspot.com/2010/11/more-on-why-paywalls-fail.html'>More on why paywalls fail</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/10/round-up-of-latest-reading.html'>Round-up of latest reading</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(5)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/09/eric-schmidt-on-automatic-search.html'>Eric Schmidt on automatic search</a></li>
<li><a href='http://glinden.blogspot.com/2010/09/causing-internal-competition-and-low.html'>Causing internal competition and low morale throug...</a></li>
<li><a href='http://glinden.blogspot.com/2010/09/cuil-is-dead.html'>Cuil is dead</a></li>
<li><a href='http://glinden.blogspot.com/2010/09/machine-learning-on-top-of-gfs-at.html'>Machine learning on top of GFS at Google</a></li>
<li><a href='http://glinden.blogspot.com/2010/09/insights-into-performance-of-microsofts.html'>Insights into the performance of Microsoft's big c...</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_08_01_archive.html'>August</a>
<span class='post-count' dir='ltr'>(3)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/08/what-is-benefit-of-freaking-customers.html'>What is the benefit of freaking customers out?</a></li>
<li><a href='http://glinden.blogspot.com/2010/08/measuring-online-brand-advertising.html'>Measuring online brand advertising without experim...</a></li>
<li><a href='http://glinden.blogspot.com/2010/08/human-computation-and-lemons.html'>Human computation and lemons</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(1)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/07/big-redesign-at-google-news.html'>Big redesign at Google News</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(5)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/06/google-to-personalize-metashopping.html'>Google to personalize metashopping</a></li>
<li><a href='http://glinden.blogspot.com/2010/06/google-on-presentation-bias-in-search.html'>Google on presentation bias in search</a></li>
<li><a href='http://glinden.blogspot.com/2010/06/travel-itineraries-from-flickr-photo.html'>Travel itineraries from Flickr photo trails</a></li>
<li><a href='http://glinden.blogspot.com/2010/06/findory-buyout-offer-from-yahoo.html'>A Findory buyout offer from Yahoo?</a></li>
<li><a href='http://glinden.blogspot.com/2010/06/how-bing-predicts-ctr-of-ads.html'>How Bing predicts the CTR of ads</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(3)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/05/geeking-with-greg-administrivia.html'>Geeking with Greg administrivia</a></li>
<li><a href='http://glinden.blogspot.com/2010/05/yahoo-as-internet-information-filter.html'>Yahoo as an internet information filter</a></li>
<li><a href='http://glinden.blogspot.com/2010/05/google-tries-to-save-news.html'>Google tries to save the news</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(3)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2010/04/facebooks-moves-and-personalized.html'>Facebook's moves and personalized advertising</a></li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(6)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(4)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2010_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2009-01-01T00:00:00-08:00&amp;updated-max=2010-01-01T00:00:00-08:00&amp;max-results=50'>2009</a>
<span class='post-count' dir='ltr'>(62)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(6)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_08_01_archive.html'>August</a>
<span class='post-count' dir='ltr'>(3)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(9)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(6)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(4)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(4)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2009_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate expanded'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy toggle-open'>▼ </span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2008-01-01T00:00:00-08:00&amp;updated-max=2009-01-01T00:00:00-08:00&amp;max-results=50'>2008</a>
<span class='post-count' dir='ltr'>(131)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(5)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(10)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(15)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(2)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_08_01_archive.html'>August</a>
<span class='post-count' dir='ltr'>(10)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(15)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(7)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(15)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(12)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(14)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(13)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate expanded'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy toggle-open'>▼ </span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2008_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(13)</span>
<ul class='posts'>
<li><a href='http://glinden.blogspot.com/2008/01/incremental-caching-for-web-search.html'>Incremental caching for web search</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/optimizing-web-20-applications.html'>Optimizing Web 2.0 applications</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/mapreduce-step-backwards.html'>MapReduce a step backwards?</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/cheap-eyetracking-using-mouse-tracking.html'>Cheap eyetracking using mouse tracking</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/lambdarank-ranknet-and-msn-search.html'>LambdaRank, RankNet, and MSN Search</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/predicting-satisfaction-with-search.html'>Predicting satisfaction with search</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/joining-microsoft-live-labs.html'>Joining Microsoft Live Labs</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/slides-on-cluster-computing-and.html'>Slides on cluster computing and MapReduce</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/mapreducing-20-petabytes-per-day.html'>MapReducing 20 petabytes per day</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/coming-2008-dot-com-crash.html'>The coming 2008 dot-com crash</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/brief-history-of-findory.html'>A brief history of Findory</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/upcoming-yahoo-talk-on-computational.html'>Upcoming Yahoo talk on computational advertising</a></li>
<li><a href='http://glinden.blogspot.com/2008/01/questions-for-2007-from-nyt.html'>Questions for 2007 from the NYT</a></li>
</ul>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2007-01-01T00:00:00-08:00&amp;updated-max=2008-01-01T00:00:00-08:00&amp;max-results=50'>2007</a>
<span class='post-count' dir='ltr'>(212)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(11)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(7)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(15)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(22)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_08_01_archive.html'>August</a>
<span class='post-count' dir='ltr'>(16)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(16)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(14)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(23)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(17)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(23)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(22)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2007_01_01_archive.html'>January</a>
<span class='post-count' dir='ltr'>(26)</span>
</li>
</ul>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/search?updated-min=2006-01-01T00:00:00-08:00&amp;updated-max=2007-01-01T00:00:00-08:00&amp;max-results=50'>2006</a>
<span class='post-count' dir='ltr'>(324)</span>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_12_01_archive.html'>December</a>
<span class='post-count' dir='ltr'>(17)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_11_01_archive.html'>November</a>
<span class='post-count' dir='ltr'>(25)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_10_01_archive.html'>October</a>
<span class='post-count' dir='ltr'>(21)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_09_01_archive.html'>September</a>
<span class='post-count' dir='ltr'>(33)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_08_01_archive.html'>August</a>
<span class='post-count' dir='ltr'>(30)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_07_01_archive.html'>July</a>
<span class='post-count' dir='ltr'>(19)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_06_01_archive.html'>June</a>
<span class='post-count' dir='ltr'>(23)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_05_01_archive.html'>May</a>
<span class='post-count' dir='ltr'>(32)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_04_01_archive.html'>April</a>
<span class='post-count' dir='ltr'>(27)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_03_01_archive.html'>March</a>
<span class='post-count' dir='ltr'>(36)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http://glinden.blogspot.com/2006_02_01_archive.html'>February</a>
<span class='post-count' dir='ltr'>(29)</span>
</li>
</ul>
<ul class='hierarchy'>
<li class='archivedate collapsed'>
<a class='toggle' href='javascript:void(0)'>
<span class='zippy'>
► 
</span>
</a>
<a class='post-count-link' href='http