Author: srowen
Date: Mon Apr 18 21:45:27 2011
New Revision: 1094781
URL: http://svn.apache.org/viewvc?rev=1094781&view=rev
Log:
MAHOUT-675 just warn about docs with no term freq vector
Modified:
mahout/trunk/utils/src/main/java/org/apache/mahout/utils/vectors/lucene/LuceneIterator.java
Modified: mahout/trunk/utils/src/main/java/org/apache/mahout/utils/vectors/lucene/LuceneIterator.java
URL: http://svn.apache.org/viewvc/mahout/trunk/utils/src/main/java/org/apache/mahout/utils/vectors/lucene/LuceneIterator.java?rev=1094781&r1=1094780&r2=1094781&view=diff
==============================================================================
--- mahout/trunk/utils/src/main/java/org/apache/mahout/utils/vectors/lucene/LuceneIterator.java (original)
+++ mahout/trunk/utils/src/main/java/org/apache/mahout/utils/vectors/lucene/LuceneIterator.java Mon Apr 18 21:45:27 2011
@@ -30,6 +30,8 @@ import org.apache.lucene.index.TermDocs;
import org.apache.lucene.index.TermFreqVector;
import org.apache.mahout.math.NamedVector;
import org.apache.mahout.math.Vector;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
/**
* An {@link Iterator} over {@link Vector}s that uses a Lucene index as the source for creating the
@@ -37,6 +39,8 @@ import org.apache.mahout.math.Vector;
*/
public final class LuceneIterator extends AbstractIterator<Vector> {
+ private static final Logger log =
LoggerFactory.getLogger(LuceneIterator.class);
+
private final IndexReader indexReader;
private final String field;
private final String idField;
@@ -82,7 +86,8 @@ public final class LuceneIterator extend
int doc = termDocs.doc();
TermFreqVector termFreqVector = indexReader.getTermFreqVector(doc,
field);
if (termFreqVector == null) {
- throw new IllegalStateException("Field '" + field + "' does not have
term vectors");
+ log.warn(indexReader.document(doc).get(idField) + " does not have a
term vector for " + field);
+ computeNext();
}
indexReader.getTermFreqVector(doc, field, mapper);