Author: siren
Date: Tue Jun 20 12:54:09 2006
New Revision: 415784

URL: http://svn.apache.org/viewvc?rev=415784&view=rev
Log:
NUTCH-292 fix summarizer oom

Modified:
    lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java

Modified: lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java
URL: http://svn.apache.org/viewvc/lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java?rev=415784&r1=415783&r2=415784&view=diff
==============================================================================
--- lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java (original)
+++ lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java Tue Jun 20 12:54:09 2006
@@ -285,7 +285,9 @@
    * </implementation:Summarizer>
    *
    * ---------------------------- */
-
+  /** Maximun number of tokens inspect in a summary . */
+  private static final int token_deep = 2000;
+
   /**
    * Class Excerpt represents a single passage found in the document, with some
    * appropriate regions highlit.
@@ -354,7 +356,7 @@
     ArrayList result = new ArrayList();
     TokenStream ts = analyzer.tokenStream("content", new StringReader(text));
     Token token = null;
-    while (true) {
+    while (result.size()<token_deep) {
       try {
         token = ts.next();
       } catch (IOException e) {

_______________________________________________
Nutch-cvs mailing list
Nutch-cvs@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/nutch-cvs