Hi, Andrzej,
SegmentReader.java fails when -nocontent or similar options are turned on.
Attached is a patch. If it looks okay, I will commit it tomorrow along with
my other patch for ndfs.
John
--- ./nutch-cvs-20041215/src/java/net/nutch/segment/SegmentReader.java	2004-12-05 01:43:48.000000000 -0800
+++ ./nutch-cvs-20041215.xing/src/java/net/nutch/segment/SegmentReader.java	2004-12-16 17:09:29.000000000 -0800
@@ -335,9 +335,13 @@
while(next(fo, co, pt, pd)) {
output.println("Recno:: " + recNo++);
output.println("FetcherOutput::\n" + fo.toString());
- output.println("Content::\n" + co.toString());
- output.println("ParseData::\n" + pd.toString());
- output.println("ParseText::\n" + pt.toString() + "\n");
+ if (contentReader != null)
+ output.println("Content::\n" + co.toString());
+ if (parseDataReader != null)
+ output.println("ParseData::\n" + pd.toString());
+ if (parseTextReader != null)
+ output.println("ParseText::\n" + pt.toString());
+ output.println("");
}
} else {
File unsortedFile = new File(segmentDir, ".unsorted");
@@ -378,9 +382,13 @@
get(recNo, fo, co, pt, pd);
output.println("Recno:: " + recNo++);
output.println("FetcherOutput::\n" + fo.toString());
- output.println("Content::\n" + co.toString());
- output.println("ParseData::\n" + pd.toString());
- output.println("ParseText::\n" + pt.toString() + "\n");
+ if (contentReader != null)
+ output.println("Content::\n" + co.toString());
+ if (parseDataReader != null)
+ output.println("ParseData::\n" + pd.toString());
+ if (parseTextReader != null)
+ output.println("ParseText::\n" + pt.toString());
+ output.println("");
}
seqReader.close();
nfs.delete(sortedFile);