<?xml version="1.0" encoding="utf-8"?>
<rss version="2.0">
<!-- MHonArc v2.6.16+ -->
  <channel>
    <title>nutch-user</title>
    <link>http://www.mail-archive.com/nutch-user@lucene.apache.org</link>
    <description>nutch-user @ lucene.apache</description>
    <pubDate>Sun, 09 May 2010 20:19:57 GMT</pubDate>
    <lastBuildDate>Sun, 09 May 2010 20:19:57 GMT</lastBuildDate>
    <docs>http://blogs.law.harvard.edu/tech/rss</docs>
    <generator>MHonArc RSS 2.0 RCFile</generator>
    <webMaster>themailarchive@gmail.com (The Mail Archive)</webMaster>
    <image>
       <title>The Mail Archive</title>
       <url>http://www.mail-archive.com/nanologo.png</url>
       <link>http://www.mail-archive.com/nutch-user@lucene.apache.org</link>
    </image>
 
    <item>
      <title>Re: full text search for java sources and subversion repository</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16426.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 20:19:04 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16426.html</guid>
   </item>
    <item>
      <title>Re: Wildcard search with nutch distributed search</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16425.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 20:16:27 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16425.html</guid>
   </item>
    <item>
      <title>full text search for java sources and subversion repository</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16424.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Rafael Kubina%22&quot;&gt;Rafael Kubina&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 20:03:30 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16424.html</guid>
   </item>
    <item>
      <title>Re: parse-pdf plugin with external libraries</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16423.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22JohnRodey%22&quot;&gt;JohnRodey&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 20:03:13 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16423.html</guid>
   </item>
    <item>
      <title>Wildcard search with nutch distributed search</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16422.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22JohnRodey%22&quot;&gt;JohnRodey&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 20:02:50 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16422.html</guid>
   </item>
    <item>
      <title>[VOTE] Apache Nutch 1.1 Release Candidate #3</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16421.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/09&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Sun, 09 May 2010 00:16:48 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16421.html</guid>
   </item>
    <item>
      <title>Re: Hi</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16420.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/07&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Harry Nutch%22&quot;&gt;Harry Nutch&lt;/a&gt;</description>
      <pubDate>Fri, 07 May 2010 00:53:32 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16420.html</guid>
   </item>
    <item>
      <title>Hi</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16419.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/06&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Zehra Göçer%22&quot;&gt;Zehra Göçer&lt;/a&gt;</description>
      <pubDate>Thu, 06 May 2010 18:00:47 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16419.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16418.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/06&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Emmanuel de Castro Santana%22&quot;&gt;Emmanuel de Castro Santana&lt;/a&gt;</description>
      <pubDate>Thu, 06 May 2010 15:14:25 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16418.html</guid>
   </item>
    <item>
      <title>parse-pdf plugin with external libraries</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16417.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/06&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Claudio Martella%22&quot;&gt;Claudio Martella&lt;/a&gt;</description>
      <pubDate>Thu, 06 May 2010 13:39:00 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16417.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16416.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/06&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Thu, 06 May 2010 05:02:07 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16416.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16415.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/05&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Julien Nioche%22&quot;&gt;Julien Nioche&lt;/a&gt;</description>
      <pubDate>Wed, 05 May 2010 08:36:53 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16415.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16414.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/05&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Wed, 05 May 2010 04:51:03 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16414.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16413.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/05&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Wed, 05 May 2010 04:08:39 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16413.html</guid>
   </item>
    <item>
      <title>Parsing html</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16412.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/04&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22nachonieto3%22&quot;&gt;nachonieto3&lt;/a&gt;</description>
      <pubDate>Tue, 04 May 2010 15:55:28 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16412.html</guid>
   </item>
    <item>
      <title>Re: Parsing .ppt, .xls, .rtf and .doc</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16411.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/04&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22nachonieto3%22&quot;&gt;nachonieto3&lt;/a&gt;</description>
      <pubDate>Tue, 04 May 2010 15:51:47 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16411.html</guid>
   </item>
    <item>
      <title>Nutch crawled databases</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16410.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/04&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Renbyna%22&quot;&gt;Renbyna&lt;/a&gt;</description>
      <pubDate>Tue, 04 May 2010 15:20:13 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16410.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16409.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 21:16:52 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16409.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16408.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Emmanuel de Castro Santana%22&quot;&gt;Emmanuel de Castro Santana&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 20:58:44 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16408.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16407.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 20:48:48 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16407.html</guid>
   </item>
    <item>
      <title>No search results on Tomcat (java.lang.NullPointerException)</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16406.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Michael%22&quot;&gt;Michael&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 20:40:45 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16406.html</guid>
   </item>
    <item>
      <title>nutch java.lang.NullPointerException</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16405.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Michael R.%22&quot;&gt;Michael R.&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 20:40:27 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16405.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16404.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Emmanuel de Castro Santana%22&quot;&gt;Emmanuel de Castro Santana&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 17:59:48 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16404.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16403.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 16:24:46 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16403.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16402.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/03&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Mon, 03 May 2010 16:06:01 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16402.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16401.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/02&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Sun, 02 May 2010 04:06:58 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16401.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16400.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/02&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Sun, 02 May 2010 03:14:26 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16400.html</guid>
   </item>
    <item>
      <title>Re: skip index directory in search results</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16399.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22b k%22&quot;&gt;b k&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 18:44:39 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16399.html</guid>
   </item>
    <item>
      <title>Re: getting malformed URL exception</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16398.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22b k%22&quot;&gt;b k&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 18:42:45 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16398.html</guid>
   </item>
    <item>
      <title>Re: Searching multiple directories</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16397.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22b k%22&quot;&gt;b k&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 18:37:26 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16397.html</guid>
   </item>
    <item>
      <title>getting malformed URL exception</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16396.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22arpit khurdiya%22&quot;&gt;arpit khurdiya&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 18:37:11 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16396.html</guid>
   </item>
    <item>
      <title>Re: why does nutch interpret directory as URL</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16395.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22b k%22&quot;&gt;b k&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 18:22:58 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16395.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16394.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 14:22:12 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16394.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16393.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 06:34:58 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16393.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16392.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 06:31:05 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16392.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16391.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 06:12:43 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16391.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16390.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 06:10:48 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16390.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16389.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/05/01&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Sat, 01 May 2010 05:44:27 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16389.html</guid>
   </item>
    <item>
      <title>Re: JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16388.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/30&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Fri, 30 Apr 2010 19:28:16 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16388.html</guid>
   </item>
    <item>
      <title>JobTracker gets stuck with DFS problems</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16387.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/30&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Emmanuel de Castro Santana%22&quot;&gt;Emmanuel de Castro Santana&lt;/a&gt;</description>
      <pubDate>Fri, 30 Apr 2010 18:10:26 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16387.html</guid>
   </item>
    <item>
      <title>Re:Search problem in nutch on eclipse (win XP)</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16386.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Harish Kumar%22&quot;&gt;Harish Kumar&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 18:20:07 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16386.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16385.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Julien Nioche%22&quot;&gt;Julien Nioche&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 17:36:58 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16385.html</guid>
   </item>
    <item>
      <title>Parsing .ppt, .xls, .rtf and .doc</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16384.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22nachonieto3%22&quot;&gt;nachonieto3&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 17:34:03 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16384.html</guid>
   </item>
    <item>
      <title>Re: why does nutch interpret directory as URL</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16383.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22arpit khurdiya%22&quot;&gt;arpit khurdiya&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 16:31:56 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16383.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16382.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22arpit khurdiya%22&quot;&gt;arpit khurdiya&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 16:28:10 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16382.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16381.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 16:04:12 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16381.html</guid>
   </item>
    <item>
      <title>Re: why does nutch interpret directory as URL</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16380.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/29&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22xiao yang%22&quot;&gt;xiao yang&lt;/a&gt;</description>
      <pubDate>Thu, 29 Apr 2010 04:30:17 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16380.html</guid>
   </item>
    <item>
      <title>why does nutch interpret directory as URL</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16379.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22BK%22&quot;&gt;BK&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 20:34:09 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16379.html</guid>
   </item>
    <item>
      <title>Fwd: Call for Participation: Technical Talks -- ApacheCon North America 2010</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16378.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Grant Ingersoll%22&quot;&gt;Grant Ingersoll&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 18:48:28 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16378.html</guid>
   </item>
    <item>
      <title>skip index directory in search results</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16377.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22BK%22&quot;&gt;BK&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 17:55:37 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16377.html</guid>
   </item>
    <item>
      <title>Re: Call for Participation: Technical Talks -- ApacheCon North America 2010</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16376.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Grant Ingersoll%22&quot;&gt;Grant Ingersoll&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 17:54:53 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16376.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16375.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 15:04:59 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16375.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16374.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 15:01:49 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16374.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16373.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 14:28:56 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16373.html</guid>
   </item>
    <item>
      <title>Re: nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16372.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 14:03:30 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16372.html</guid>
   </item>
    <item>
      <title>Problem with Standard analyzer</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16371.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Srinivas Gokavarapu%22&quot;&gt;Srinivas Gokavarapu&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 11:35:44 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16371.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16370.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 11:00:14 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16370.html</guid>
   </item>
    <item>
      <title>nutch crawl issue</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16369.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/28&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22matthew a. grisius%22&quot;&gt;matthew a. grisius&lt;/a&gt;</description>
      <pubDate>Wed, 28 Apr 2010 04:40:44 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16369.html</guid>
   </item>
    <item>
      <title>Issues in recrawling</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16368.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/27&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22arpit khurdiya%22&quot;&gt;arpit khurdiya&lt;/a&gt;</description>
      <pubDate>Tue, 27 Apr 2010 17:57:39 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16368.html</guid>
   </item>
    <item>
      <title>Problem while updating crawldb from segments directory</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16367.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/27&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22hareesh%22&quot;&gt;hareesh&lt;/a&gt;</description>
      <pubDate>Tue, 27 Apr 2010 08:08:34 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16367.html</guid>
   </item>
    <item>
      <title>Re: Hadoop Disk Error</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16366.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/27&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Tue, 27 Apr 2010 07:34:49 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16366.html</guid>
   </item>
    <item>
      <title>Re: Hadoop Disk Error</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16365.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Joshua J Pavel%22&quot;&gt;Joshua J Pavel&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 20:32:02 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16365.html</guid>
   </item>
    <item>
      <title>Re: Running ANT; was -- Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16364.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 19:09:03 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16364.html</guid>
   </item>
    <item>
      <title>Re: Running ANT; was -- Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16363.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:30:40 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16363.html</guid>
   </item>
    <item>
      <title>Searching multiple directories</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16362.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22BK%22&quot;&gt;BK&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:24:34 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16362.html</guid>
   </item>
    <item>
      <title>Re: Lucandra - Lucene/Solr on Cassandra: April 26, NYC</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16361.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Utku Can Topçu%22&quot;&gt;Utku Can Topçu&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:23:30 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16361.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16360.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:19:45 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16360.html</guid>
   </item>
    <item>
      <title>Re: Running ANT; was -- Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16359.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:15:16 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16359.html</guid>
   </item>
    <item>
      <title>Re: Running ANT; was -- Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16358.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 15:13:34 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16358.html</guid>
   </item>
    <item>
      <title>Running ANT; was -- Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16357.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22David M. Cole%22&quot;&gt;David M. Cole&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 14:52:06 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16357.html</guid>
   </item>
    <item>
      <title>Re: ANNOUNCE: Nutch becomes an Apache Top-Level Project (TLP)</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16356.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Ashumeet Singh%22&quot;&gt;Ashumeet Singh&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 14:26:13 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16356.html</guid>
   </item>
    <item>
      <title>ANNOUNCE: Nutch becomes an Apache Top-Level Project (TLP)</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16355.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 12:57:30 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16355.html</guid>
   </item>
    <item>
      <title>Re: [VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16354.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Grant Ingersoll%22&quot;&gt;Grant Ingersoll&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 12:34:37 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16354.html</guid>
   </item>
    <item>
      <title>Re: How to do faceting on data indexed by Nutch</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16353.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Alvaro Cabrerizo%22&quot;&gt;Alvaro Cabrerizo&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 11:31:20 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16353.html</guid>
   </item>
    <item>
      <title>[VOTE] Apache Nutch 1.1 Release Candidate #2</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16352.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/26&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Mattmann, Chris A (388J)%22&quot;&gt;Mattmann, Chris A (388J)&lt;/a&gt;</description>
      <pubDate>Mon, 26 Apr 2010 05:56:33 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16352.html</guid>
   </item>
    <item>
      <title>Separate Nutch(crawl) and Lucene (index/search)</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16351.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/25&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22sb101h%22&quot;&gt;sb101h&lt;/a&gt;</description>
      <pubDate>Sun, 25 Apr 2010 18:25:05 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16351.html</guid>
   </item>
    <item>
      <title>Re: How to do faceting on data indexed by Nutch</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16350.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/25&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Andrzej Bialecki%22&quot;&gt;Andrzej Bialecki&lt;/a&gt;</description>
      <pubDate>Sun, 25 Apr 2010 18:24:17 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16350.html</guid>
   </item>
    <item>
      <title>How to do faceting on data indexed by Nutch</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16349.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/25&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22KK%22&quot;&gt;KK&lt;/a&gt;</description>
      <pubDate>Sun, 25 Apr 2010 13:04:26 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16349.html</guid>
   </item>
    <item>
      <title>Web Service on Nutch</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16348.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/25&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Kim Theng Chong%22&quot;&gt;Kim Theng Chong&lt;/a&gt;</description>
      <pubDate>Sun, 25 Apr 2010 07:42:30 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16348.html</guid>
   </item>
    <item>
      <title>RE: Is there some arbitrary limit on content stored for use by summaries?</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16347.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/23&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Tim Redding%22&quot;&gt;Tim Redding&lt;/a&gt;</description>
      <pubDate>Fri, 23 Apr 2010 09:50:17 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16347.html</guid>
   </item>
    <item>
      <title>Re: how to parse html files while crawling</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16346.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/23&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22cefurkan0 cefurkan0%22&quot;&gt;cefurkan0 cefurkan0&lt;/a&gt;</description>
      <pubDate>Fri, 23 Apr 2010 01:09:55 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16346.html</guid>
   </item>
    <item>
      <title>RE: Language specifications</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16345.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Arkadi.Kosmynin%22&quot;&gt;Arkadi.Kosmynin&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 22:33:26 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16345.html</guid>
   </item>
    <item>
      <title>Language specifications</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16344.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Joshua J Pavel%22&quot;&gt;Joshua J Pavel&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 20:57:12 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16344.html</guid>
   </item>
    <item>
      <title>Re: Is there some arbitrary limit on content stored for use by 	summaries?</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16343.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Julien Nioche%22&quot;&gt;Julien Nioche&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 20:56:54 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16343.html</guid>
   </item>
    <item>
      <title>RE: Is there some arbitrary limit on content stored for use by summaries?</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16342.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Tim Redding%22&quot;&gt;Tim Redding&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 17:44:38 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16342.html</guid>
   </item>
    <item>
      <title>Lucandra - Lucene/Solr on Cassandra: April 26, NYC</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16341.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Otis Gospodnetic%22&quot;&gt;Otis Gospodnetic&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 16:52:00 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16341.html</guid>
   </item>
    <item>
      <title>Re: Scheduler questions, 1.1 nightly build.</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16340.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 09:05:02 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16340.html</guid>
   </item>
    <item>
      <title>Scheduler questions, 1.1 nightly build.</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16339.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Phil Barnett%22&quot;&gt;Phil Barnett&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 08:59:57 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16339.html</guid>
   </item>
    <item>
      <title>Re: Format of the Nutch Results</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16338.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22nachonieto3%22&quot;&gt;nachonieto3&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 08:37:54 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16338.html</guid>
   </item>
    <item>
      <title>Re: Format of the Nutch Results</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16337.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Harry Nutch%22&quot;&gt;Harry Nutch&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 01:54:06 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16337.html</guid>
   </item>
    <item>
      <title>Re: AbstractMethodError for cyberneko parser</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16336.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/22&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Harry Nutch%22&quot;&gt;Harry Nutch&lt;/a&gt;</description>
      <pubDate>Thu, 22 Apr 2010 01:44:06 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16336.html</guid>
   </item>
    <item>
      <title>April Seattle Hadoop/Scalability/NoSQL Meetup: Cassandra, Science, 	More!</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16335.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Bradford Stephens%22&quot;&gt;Bradford Stephens&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 22:38:21 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16335.html</guid>
   </item>
    <item>
      <title>RE: Is there some arbitrary limit on content stored for use by summaries?</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16334.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Arkadi.Kosmynin%22&quot;&gt;Arkadi.Kosmynin&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 22:29:33 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16334.html</guid>
   </item>
    <item>
      <title>Re: nutch says No URLs to fetch - check your seed list and URL 	filters when trying to index fmforums.com</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16333.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22joshua paul%22&quot;&gt;joshua paul&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 19:03:15 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16333.html</guid>
   </item>
    <item>
      <title>Re: Hadoop Disk Error</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16332.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Joshua J Pavel%22&quot;&gt;Joshua J Pavel&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 17:57:12 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16332.html</guid>
   </item>
    <item>
      <title>specify nutchConfiguration File</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16331.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Jan Philippe Wimmer%22&quot;&gt;Jan Philippe Wimmer&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 16:19:15 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16331.html</guid>
   </item>
    <item>
      <title>Is there some arbitrary limit on content stored for use by summaries?</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16330.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Tim Redding%22&quot;&gt;Tim Redding&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 16:19:00 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16330.html</guid>
   </item>
    <item>
      <title>Re: Hadoop Disk Error</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16329.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Julien Nioche%22&quot;&gt;Julien Nioche&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 14:43:51 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16329.html</guid>
   </item>
    <item>
      <title>RE: Hadoop Disk Error</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16328.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22Joshua J Pavel%22&quot;&gt;Joshua J Pavel&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 14:29:22 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16328.html</guid>
   </item>
    <item>
      <title>Re: how to parse html files while crawling</title>
      <link>http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16327.html</link>
      <description>&lt;font color=#6f6f6f&gt; 2010/04/21&lt;/font&gt; -- &lt;a href=&quot;http://www.mail-archive.com/search?l=nutch-user@lucene.apache.org&amp;q=from:%22nachonieto3%22&quot;&gt;nachonieto3&lt;/a&gt;</description>
      <pubDate>Wed, 21 Apr 2010 13:39:04 GMT</pubDate>
      <guid isPermaLink="true">http://www.mail-archive.com/nutch-user@lucene.apache.org/msg16327.html</guid>
   </item>
 
  </channel>
  </rss>
<!-- MHonArc v2.6.16+ -->

