Author: ssmiweve
Date: 2007-06-08 10:52:26 +0200 (Fri, 08 Jun 2007)
New Revision: 5292

Modified:
   branches/2.13/query-api/src/main/javacc/QueryParserImpl.jj
Log:
SEARCH-2711 - Lang soekestreng gir veeeldig mange treff i katalog (hyphen variations)

Modified: branches/2.13/query-api/src/main/javacc/QueryParserImpl.jj
===================================================================
--- branches/2.13/query-api/src/main/javacc/QueryParserImpl.jj  2007-06-07 20:30:17 UTC (rev 5291)
+++ branches/2.13/query-api/src/main/javacc/QueryParserImpl.jj  2007-06-08 08:52:26 UTC (rev 5292)
@@ -61,6 +61,7 @@
     | < [ "\u007b"-"\u00bf" ] >
     | < [ "\u00d7" ] >
     | < [ "\u00f7" ] >
+    | < [ "\u2010"-"\u2015" ] >
 }
 
 /* These are the the above skip characters */
@@ -69,6 +70,7 @@
 /* . / */
 /* ; < = > ? @ */
 /* [ \ ] ^ _ ` */
+/* ‐ ‑ ‒ – — ― */
 
 <DEFAULT,EMAIL_DISABLED,PHONE_NUMBER_DISABLED,NUMBER_GROUP_DISABLED,QUOTED_WORD_DISABLED>
 TOKEN : { <URL: "http://"<WORD>("/"<WORD>)*> }
@@ -101,25 +103,34 @@
     | <#PHONE_MIDDLE: ((" ")*<PHONE_SYMBOL>(" ")*)|(" ")+>
     | <#PHONE_SYMBOL: (".")|("-")|("/")>
     | <#WORD_SYMBOL_PREFIX: (".")|("<")|("=")|(">")>
-    | <#WORD_SYMBOL_MIDDLE: (".")|("-")|("_")|("+")>
+    | <#WORD_SYMBOL_MIDDLE: (".")|<HYPON>|("_")|("+")>
     | <#WORD_SEPARATOR: [ // just a copy of the SKIP declaration.
             " ", "!", 
             "\u0023"-"\u0040",
             "\u005b"-"\u0060",
             "\u007b"-"\u00bf",
             "\u00d7",
-            "\u00f7"
+            "\u00f7",
+            "\u2010"-"\u2015"
         ]>
+    | <#HYPON: // Different types of hypons, http://www.cs.tut.fi/~jkorpela/dashes.html
+        [
+            "-",
+            "\u2010"-"\u2015",
+            "\u207b",
+            "\u208b",
+            "\u2212"
+        ]>
     | <#LETTER:
-    /** UNICODE Characters **/
         [
             "\u0041"-"\u005a",
             "\u0061"-"\u007a",
             "\u00c0"-"\u00d6",
             "\u00d8"-"\u00f6",
-            "\u00f8"-"\uffff"
+            "\u00f8"-"\u200f",
+            "\u2016"-"\uffff"
         ]>
-    | < #DIGIT:                      // unicode digits
+    | <#DIGIT:
           [
            "\u0030"-"\u0039",
            "\u0660"-"\u0669",

_______________________________________________
Kernel-commits mailing list
[email protected]
http://sesat.no/mailman/listinfo/kernel-commits

Reply via email to