Index: src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java
===================================================================
--- src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java (Revision 886112)
+++ src/java/org/apache/nutch/crawl/AbstractFetchSchedule.java (Arbeitskopie)
@@ -145,7 +145,7 @@
* included in the further selection process based on scores. The default
* implementation checks <code>fetchTime</code>, if it is higher than the
* {@param curTime} it returns false, and true otherwise. It will also
- * check that fetchTime is not too remote (more than <code>maxInterval</code),
+ * check that fetchTime is not too remote (more than <code>maxInterval</code>,
* in which case it lowers the interval and returns true.
* @param url URL of the page
* @param datum datum instance
Index: src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java
===================================================================
--- src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java (Revision 886112)
+++ src/java/org/apache/nutch/crawl/DefaultFetchSchedule.java (Arbeitskopie)
@@ -35,6 +35,9 @@
long fetchTime, long modifiedTime, int state) {
datum = super.setFetchSchedule(url, datum, prevFetchTime, prevModifiedTime,
fetchTime, modifiedTime, state);
+ if (datum.getFetchInterval() == 0 ) {
+ datum.setFetchInterval(defaultInterval);
+ }
datum.setFetchTime(fetchTime + (long)datum.getFetchInterval() * 1000);
datum.setModifiedTime(modifiedTime);
return datum;