Author: dogacan
Date: Thu Jul 26 01:10:38 2007
New Revision: 559742

URL: http://svn.apache.org/viewvc?view=rev&rev=559742
Log:
NUTCH-516 - Next fetch time is not set when it is a CrawlDatum.STATUS_FETCH_GONE. Contributed by Emmanuel Joke.

Modified:
    lucene/nutch/trunk/CHANGES.txt
    lucene/nutch/trunk/src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java
    lucene/nutch/trunk/src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java

Modified: lucene/nutch/trunk/CHANGES.txt
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/CHANGES.txt?view=diff&rev=559742&r1=559741&r2=559742
==============================================================================
--- lucene/nutch/trunk/CHANGES.txt (original)
+++ lucene/nutch/trunk/CHANGES.txt Thu Jul 26 01:10:38 2007
@@ -96,6 +96,9 @@
 32. NUTCH-518 - Fix OpicScoringFilter to respect scoring filter chaining.
     (Enis Soztutar via dogacan)
 
+33. NUTCH-516 - Next fetch time is not set when it is a
+    CrawlDatum.STATUS_FETCH_GONE. (Emmanuel Joke via dogacan)
+
 Release 0.9 - 2007-04-02
 
  1. Changed log4j confiquration to log to stdout on commandline

Modified: lucene/nutch/trunk/src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java?view=diff&rev=559742&r1=559741&r2=559742
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java Thu Jul 26 01:10:38 2007
@@ -91,6 +91,7 @@
     // no page is truly GONE ... just increase the interval by 50%
     // and try much later.
     datum.setFetchInterval(datum.getFetchInterval() * 1.5f);
+    datum.setFetchTime(fetchTime + Math.round(datum.getFetchInterval() * 1000.0d));
     if (maxInterval < datum.getFetchInterval()) forceRefetch(url, datum, false);
     return datum;
   }

Modified: lucene/nutch/trunk/src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java?view=diff&rev=559742&r1=559741&r2=559742
==============================================================================
--- lucene/nutch/trunk/src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java (original)
+++ lucene/nutch/trunk/src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java Thu Jul 26 01:10:38 2007
@@ -32,7 +32,7 @@
   public CrawlDatum setFetchSchedule(Text url, CrawlDatum datum,
           long prevFetchTime, long prevModifiedTime,
           long fetchTime, long modifiedTime, int state) {
-    datum.setFetchTime(fetchTime + Math.round(datum.getFetchInterval() * 1000.0f));
+    datum.setFetchTime(fetchTime + Math.round(datum.getFetchInterval() * 1000.0d));
     datum.setModifiedTime(modifiedTime);
     return datum;
   }