Author: siren
Date: Tue Jun 20 12:54:09 2006
New Revision: 415784

URL: http://svn.apache.org/viewvc?rev=415784&view=rev
Log:
NUTCH-292 fix summarizer oom

Modified:
    
lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java

Modified: 
lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java
URL: 
http://svn.apache.org/viewvc/lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java?rev=415784&r1=415783&r2=415784&view=diff
==============================================================================
--- 
lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java
 (original)
+++ 
lucene/nutch/trunk/src/plugin/summary-basic/src/java/org/apache/nutch/summary/basic/BasicSummarizer.java
 Tue Jun 20 12:54:09 2006
@@ -285,7 +285,9 @@
    * </implementation:Summarizer> *
    * ---------------------------- */
   
-  
+  /** Maximum number of tokens to inspect in a summary. */
+  private static final int token_deep = 2000;
+
   /**
    * Class Excerpt represents a single passage found in the document, with some
    * appropriate regions highlit.
@@ -354,7 +356,7 @@
     ArrayList result = new ArrayList();
     TokenStream ts = analyzer.tokenStream("content", new StringReader(text));
     Token token = null;
-    while (true) {
+    while (result.size()<token_deep) {
       try {
         token = ts.next();
       } catch (IOException e) {




_______________________________________________
Nutch-cvs mailing list
Nutch-cvs@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/nutch-cvs

Reply via email to