Author: cutting
Date: Thu Jun  2 12:05:24 2005
New Revision: 179628

URL: http://svn.apache.org/viewcvs?rev=179628&view=rev
Log:
Fix so that stop words are not removed when they're field-qualified.

Modified:
    incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.java
    incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.jj

Modified: 
incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.java
URL: 
http://svn.apache.org/viewcvs/incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.java?rev=179628&r1=179627&r2=179628&view=diff
==============================================================================
--- incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.java 
(original)
+++ incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.java 
Thu Jun  2 12:05:24 2005
@@ -122,8 +122,11 @@
      nonOpOrTerm();
       String[] array = (String[])terms.toArray(new String[terms.size()]);
 
-      if (stop && terms.size()==1 && isStopWord(array[0])) {
-        // ignore stop words only when single, unadorned terms
+      if (stop
+          && field == Clause.DEFAULT_FIELD
+          && terms.size()==1
+          && isStopWord(array[0])) {
+        // ignore a stop word only when it is a single, unadorned term in the default field; field-qualified ones are kept
       } else {
         if (prohibited)
           query.addProhibitedPhrase(array, field);
@@ -443,35 +446,11 @@
     finally { jj_save(2, xla); }
   }
 
-  final private boolean jj_3R_17() {
-    Token xsp;
-    xsp = jj_scanpos;
-    if (jj_scan_token(10)) {
-    jj_scanpos = xsp;
-    if (jj_scan_token(11)) {
-    jj_scanpos = xsp;
-    if (jj_scan_token(12)) {
-    jj_scanpos = xsp;
-    if (jj_scan_token(13)) {
-    jj_scanpos = xsp;
-    if (jj_scan_token(14)) return true;
-    }
-    }
-    }
-    }
-    return false;
-  }
-
   final private boolean jj_3R_26() {
     if (jj_3R_16()) return true;
     return false;
   }
 
-  final private boolean jj_3R_8() {
-    if (jj_3R_14()) return true;
-    return false;
-  }
-
   final private boolean jj_3R_16() {
     Token xsp;
     xsp = jj_scanpos;
@@ -496,6 +475,11 @@
     return false;
   }
 
+  final private boolean jj_3R_8() {
+    if (jj_3R_14()) return true;
+    return false;
+  }
+
   final private boolean jj_3R_15() {
     if (jj_3R_11()) return true;
     Token xsp;
@@ -524,18 +508,6 @@
     return false;
   }
 
-  final private boolean jj_3_1() {
-    if (jj_scan_token(WORD)) return true;
-    if (jj_scan_token(COLON)) return true;
-    Token xsp;
-    xsp = jj_scanpos;
-    if (jj_3R_8()) {
-    jj_scanpos = xsp;
-    if (jj_3R_9()) return true;
-    }
-    return false;
-  }
-
   final private boolean jj_3R_23() {
     if (jj_3R_24()) return true;
     return false;
@@ -562,6 +534,18 @@
     return false;
   }
 
+  final private boolean jj_3_1() {
+    if (jj_scan_token(WORD)) return true;
+    if (jj_scan_token(COLON)) return true;
+    Token xsp;
+    xsp = jj_scanpos;
+    if (jj_3R_8()) {
+    jj_scanpos = xsp;
+    if (jj_3R_9()) return true;
+    }
+    return false;
+  }
+
   final private boolean jj_3R_24() {
     Token xsp;
     xsp = jj_scanpos;
@@ -610,13 +594,13 @@
     return false;
   }
 
-  final private boolean jj_3R_9() {
-    if (jj_3R_15()) return true;
+  final private boolean jj_3R_19() {
+    if (jj_3R_24()) return true;
     return false;
   }
 
-  final private boolean jj_3R_19() {
-    if (jj_3R_24()) return true;
+  final private boolean jj_3R_9() {
+    if (jj_3R_15()) return true;
     return false;
   }
 
@@ -651,6 +635,25 @@
     if (jj_scan_token(9)) {
     jj_scanpos = xsp;
     if (jj_scan_token(0)) return true;
+    }
+    return false;
+  }
+
+  final private boolean jj_3R_17() {
+    Token xsp;
+    xsp = jj_scanpos;
+    if (jj_scan_token(10)) {
+    jj_scanpos = xsp;
+    if (jj_scan_token(11)) {
+    jj_scanpos = xsp;
+    if (jj_scan_token(12)) {
+    jj_scanpos = xsp;
+    if (jj_scan_token(13)) {
+    jj_scanpos = xsp;
+    if (jj_scan_token(14)) return true;
+    }
+    }
+    }
     }
     return false;
   }

Modified: 
incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.jj
URL: 
http://svn.apache.org/viewcvs/incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.jj?rev=179628&r1=179627&r2=179628&view=diff
==============================================================================
--- incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.jj 
(original)
+++ incubator/nutch/trunk/src/java/org/apache/nutch/analysis/NutchAnalysis.jj 
Thu Jun  2 12:05:24 2005
@@ -204,8 +204,11 @@
     {
       String[] array = (String[])terms.toArray(new String[terms.size()]);
 
-      if (stop && terms.size()==1 && isStopWord(array[0])) {
-        // ignore stop words only when single, unadorned terms
+      if (stop
+          && field == Clause.DEFAULT_FIELD
+          && terms.size()==1
+          && isStopWord(array[0])) {
+        // ignore a stop word only when it is a single, unadorned term in the default field; field-qualified ones are kept
       } else {
         if (prohibited)
           query.addProhibitedPhrase(array, field);




-------------------------------------------------------
This SF.Net email is sponsored by Yahoo.
Introducing Yahoo! Search Developer Network - Create apps using Yahoo!
Search APIs Find out how you can build Yahoo! directly into your own
Applications - visit http://developer.yahoo.net/?fr=offad-ysdn-ostg-q22005
_______________________________________________
Nutch-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/nutch-cvs

Reply via email to