Help! My production environment is blocked by this error. I deleted the segment altogether and restarted crawl/fetch/parse, but I am still stuck and cannot add segments anymore. It looks like an HDFS problem?
2010-01-18 19:53:00,785 WARN hdfs.DFSClient - DFS Read: java.io.IOException: Could not obtain block: blk_-6931814167688802826_9735 file=/user/root/crawl/indexed-segments/20100117235244/part-00000/_1lr.prx at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.chooseDataNode(DFSClient.java:1707) at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.blockSeekTo(DFSClient.java:1535) at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.read(DFSClient.java:1662) at java.io.DataInputStream.read(DataInputStream.java:149) at org.apache.nutch.indexer.FsDirectory$DfsIndexInput.readInternal(FsDirectory.java:178) at org.apache.lucene.store.BufferedIndexInput.refill(BufferedIndexInput.java:157) at org.apache.lucene.store.BufferedIndexInput.readByte(BufferedIndexInput.java:38) at org.apache.lucene.store.IndexInput.readVInt(IndexInput.java:78) at org.apache.lucene.index.SegmentTermPositions.readDeltaPosition(SegmentTermPositions.java:73) at org.apache.lucene.index.SegmentTermPositions.nextPosition(SegmentTermPositions.java:69) at org.apache.lucene.index.SegmentMerger.appendPostings(SegmentMerger.java:667) at org.apache.lucene.index.SegmentMerger.mergeTermInfo(SegmentMerger.java:586) at org.apache.lucene.index.SegmentMerger.mergeTermInfos(SegmentMerger.java:547) at org.apache.lucene.index.SegmentMerger.mergeTerms(SegmentMerger.java:500) at org.apache.lucene.index.SegmentMerger.merge(SegmentMerger.java:140) at org.apache.lucene.index.IndexWriter.mergeMiddle(IndexWriter.java:4226) at org.apache.lucene.index.IndexWriter.merge(IndexWriter.java:3877) at org.apache.lucene.index.ConcurrentMergeScheduler.doMerge(ConcurrentMergeScheduler.java:205) at org.apache.lucene.index.ConcurrentMergeScheduler$MergeThread.run(ConcurrentMergeScheduler.java:260) 2010-01-18 19:53:01,210 FATAL indexer.IndexMerger - IndexMerger: java.io.IOException: background merge hit exception: _2q:Cx4844 _5z:Cx10544 _ko:Cx36459 _q5:Cx46128 _l8:Cx37407 _t4:Cx51363 _1sv:Cx114442 _ek:Cx25656 _9d:Cx16546 _ad:Cx18255 _kp:Cx36539 
_s0:Cx49395 _ny:Cx42237 _l7:Cx37392 _6s:Cx11976 _7k:Cx13326 _h7:Cx30314 _oe:Cx43029 _uq:Cx54179 _xi:Cx59085 _112:Cx65398 _141:Cx70607 _15h:Cx73181 _17c:Cx76450 _16i:Cx74951 _182:Cx77703 _150:Cx72344 _15e:Cx73047 _14e:Cx71203 _15f:Cx73078 _149:Cx71025 _155:Cx72571 _1n2:Cx104197 _1o4:Cx106042 _1ea:Cx88687 _17o:Cx77042 _18f:Cx78392 _1ds:Cx87839 _141:Cx70632 _103:Cx63684 _ym:Cx61086 _1lr:Cx101890 into _0 [optimize] at org.apache.lucene.index.IndexWriter.optimize(IndexWriter.java:2258) at org.apache.lucene.index.IndexWriter.optimize(IndexWriter.java:2203) at org.apache.lucene.index.IndexWriter.optimize(IndexWriter.java:2183) at org.apache.lucene.index.IndexWriter.addIndexes(IndexWriter.java:2877) at org.apache.nutch.indexer.IndexMerger.merge(IndexMerger.java:97) at org.apache.nutch.indexer.IndexMerger.run(IndexMerger.java:149) at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:65) at org.apache.nutch.indexer.IndexMerger.main(IndexMerger.java:111) Caused by: java.io.IOException: Could not obtain block: blk_-6931814167688802826_9735 file=/user/root/crawl/indexed-segments/20100117235244/part-00000/_1lr.prx at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.chooseDataNode(DFSClient.java:1707) at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.blockSeekTo(DFSClient.java:1535) at org.apache.hadoop.hdfs.DFSClient$DFSInputStream.read(DFSClient.java:1662) at java.io.DataInputStream.read(DataInputStream.java:149) at org.apache.nutch.indexer.FsDirectory$DfsIndexInput.readInternal(FsDirectory.java:178) at org.apache.lucene.store.BufferedIndexInput.refill(BufferedIndexInput.java:157) at org.apache.lucene.store.BufferedIndexInput.readByte(BufferedIndexInput.java:38) at org.apache.lucene.store.IndexInput.readVInt(IndexInput.java:78) at org.apache.lucene.index.SegmentTermPositions.readDeltaPosition(SegmentTermPositions.java:73) at org.apache.lucene.index.SegmentTermPositions.nextPosition(SegmentTermPositions.java:69) at 
org.apache.lucene.index.SegmentMerger.appendPostings(SegmentMerger.java:667) at org.apache.lucene.index.SegmentMerger.mergeTermInfo(SegmentMerger.java:586) at org.apache.lucene.index.SegmentMerger.mergeTermInfos(SegmentMerger.java:547) at org.apache.lucene.index.SegmentMerger.mergeTerms(SegmentMerger.java:500) at org.apache.lucene.index.SegmentMerger.merge(SegmentMerger.java:140) at org.apache.lucene.index.IndexWriter.mergeMiddle(IndexWriter.java:4226) at org.apache.lucene.index.IndexWriter.merge(IndexWriter.java:3877) at org.apache.lucene.index.ConcurrentMergeScheduler.doMerge(ConcurrentMergeScheduler.java:205) at org.apache.lucene.index.ConcurrentMergeScheduler$MergeThread.run(ConcurrentMergeScheduler.java:260) -- -MilleBii-