Revision: 6023
          
http://languagetool.svn.sourceforge.net/languagetool/?rev=6023&view=rev
Author:   dominikoeo
Date:     2011-12-10 20:35:07 +0000 (Sat, 10 Dec 2011)
Log Message:
-----------
[br] - better disambiguation of the word "o" which
       allows detecting more incorrect mutations such as:
       *o patatez* ?\226?\134?\146 "o fatatez".
     - fixed a couple of false positives.

Modified Paths:
--------------
    trunk/JLanguageTool/src/resource/br/disambiguation.xml
    trunk/JLanguageTool/src/rules/br/grammar.xml

Modified: trunk/JLanguageTool/src/resource/br/disambiguation.xml
===================================================================
--- trunk/JLanguageTool/src/resource/br/disambiguation.xml      2011-12-10 
18:55:43 UTC (rev 6022)
+++ trunk/JLanguageTool/src/resource/br/disambiguation.xml      2011-12-10 
20:35:07 UTC (rev 6023)
@@ -39,6 +39,13 @@
       <disambig postag="P"/>
     </rule>
   </rulegroup>
+  <rule id="O_R" name="O pronoun">
+    <pattern mark="0">
+      <token>o</token>
+      <token postag="N .*" postag_regexp="yes"><exception postag="V 
inf.*"/></token>
+    </pattern>
+    <disambig postag="R e p 3 obj"/>
+  </rule>
   <rulegroup id="VERB_PARTICLE" name="verb particule">
     <rule>
       <pattern mark="0">

Modified: trunk/JLanguageTool/src/rules/br/grammar.xml
===================================================================
--- trunk/JLanguageTool/src/rules/br/grammar.xml        2011-12-10 18:55:43 UTC 
(rev 6022)
+++ trunk/JLanguageTool/src/rules/br/grammar.xml        2011-12-10 20:35:07 UTC 
(rev 6023)
@@ -699,6 +699,9 @@
         <example type="incorrect">Re ziwezhat out va 
<marker>baotr</marker>!</example>
         <example type="correct">Re ziwezhat out va faotr!</example>
         <example type="correct">Va beg digor</example>
+        <example type="incorrect">Bras eo o <marker>patatez</marker>.</example>
+        <example type="incorrect">Bras eo o <marker>batatez</marker>.</example>
+        <example type="correct">Bras eo o fatatez.</example>
       </rule>
       <rule>
         <pattern mark_from="1">
@@ -888,7 +891,7 @@
           <token regexp="yes">[au]n</token>
           <and>
             <token postag="N m s.*|N f p.*" postag_regexp="yes" 
regexp="yes">[dz].*
-              <exception regexp="yes">dra(-(mañ|se|hont))?</exception>
+              <exception regexp="yes">dra(ig)?(-(mañ|se|hont))?</exception>
               <exception postag="N m s.*|N f p.*" postag_regexp="yes" 
regexp="yes" inflected="yes">[dz].*</exception>
             </token>
             <token postag="N m s.*|N f p.*" postag_regexp="yes" regexp="yes" 
inflected="yes">t.*
@@ -1563,7 +1566,7 @@
     <rule id="AL" name="gerioù al, ul, el, hol">
       <pattern mark_to="-1">
         <token regexp="yes">[aeu][nr]|hor<exception postag="X EN_UR"/></token>
-        <token regexp="yes">l..*</token>
+        <token regexp="yes">l..*<exception regexp="yes" 
postag="UNKNOWN">L\p{Lu}*</exception></token>
       </pattern>
       <message>Ar ger «\1» a zlefe bezañ <suggestion><match no="1" 
regexp_match="(.*)." regexp_replace="$1l"/></suggestion> dirak ur ger a grog 
gant ar gensonenn «l».</message>
       <example type="incorrect"><marker>Ur</marker> levr a zo ganin.</example>
@@ -1576,6 +1579,7 @@
       <example type="correct">Tev eo hol levr.</example>
       <example type="correct">Kouezhet on en ur lammat.</example>
       <example type="correct">An l glebiet</example>
+      <example type="correct">An LTB</example>
     </rule>
     <rule id="AN" name="gerioù an, un, en, hon">
       <pattern mark_to="-1">
@@ -1609,7 +1613,7 @@
           <token regexp="yes">[aeu]n<exception scope="previous" 
regexp="yes">e?z|ned</exception></token>
           <token regexp="yes">[bcfgjkmprsvwyz].*
             <exception postag="K .* o.*" postag_regexp="yes"></exception>
-            <exception regexp="yes" 
postag="UNKNOWN">[FLMNRS]\p{Lu}*</exception>
+            <exception regexp="yes" 
postag="UNKNOWN">[FMNRS](\p{Lu}|-)*</exception>
             <exception regexp="yes">[FLMNRS]\d*</exception>
           </token>
         </pattern>
@@ -1621,6 +1625,7 @@
         <example type="correct">Ar ouiziegezh</example>
         <example type="incorrect"><marker>AN</marker> FILM A BLIJ DIN</example>
         <example type="correct">Gant an FSE</example>
+        <example type="correct">An SNJ-CGT</example>
         <example type="correct">Un S.O.S.</example>
         <example type="correct">Gustav ez an war-sav.</example>
       </rule>
@@ -2141,13 +2146,14 @@
     <rule id="E_KREIZ" name="e kreiz → e-kreiz (hag all)">
       <pattern>
         <token>e</token>
-        <token 
regexp="yes">barzh|douare|giz(-(all|mañ|se|hon))?|harz|hunan|keit(-se)?|kerz|kichen|krec’h|kreiz|lec’h|leizh|maez|pad|sell|ser|tailh|tal|touez|tro|unan</token>
+        <token 
regexp="yes">barzh|douare|giz(-(all|mañ|se|hon))?|harz|hunan|keit(-se)?|kerz|kichen|krec’h|kreiz|leizh|maez|pad|sell|ser|tailh|tal|touez|tro|unan</token>
       </pattern>
       <message>Implijit <suggestion>\1-\2</suggestion>.</message>
       <example type="incorrect"><marker>E kichen</marker> Gwitalmeze emañ o 
chom.</example>
       <example type="correct">E-kichen Gwitalmeze emañ o chom.</example>
       <example type="incorrect">Rwanda zo ur vro <marker>e kreiz</marker> 
Afrika.</example>
       <example type="correct">Rwanda zo ur vro e-kreiz Afrika.</example>
+      <example type="correct">E breizh hag <marker>e lec’h</marker> 
all.</example>
     </rule>
 
     <rule id="DIWAR_BENN" name="diwar benn → diwar-benn (hag all)">
@@ -2377,12 +2383,13 @@
     </rulegroup>
     <rule id="DIGAREZIT_DIN" name="Digarezit din → Digarezit ac’hanon">
       <pattern mark_from="1">
-        <token regexp="yes">digarez(it)?</token>
+        <token regexp="yes">digarez(it)?<exception 
scope="previous">un</exception></token>
         <token inflected="yes">da</token>
       </pattern>
       <message>Ne vez ket implijet an araogenn «da» gat ar verb «\1».</message>
       <example type="incorrect">Digarezit <marker>dimp</marker></example>
       <example type="correct">Digarezit ac’hanomp</example>
+      <example type="correct">Un digarez da ziskouez Breizh.</example>
     </rule>
     <rule id="A_RAOK_DA" name="Digarezit din → Digarezit ac’hanon">
       <pattern mark_from="1" mark_to="-1">

This was sent by the SourceForge.net collaborative development platform, the 
world's largest Open Source development site.


------------------------------------------------------------------------------
Learn Windows Azure Live!  Tuesday, Dec 13, 2011
Microsoft is holding a special Learn Windows Azure training event for 
developers. It will provide a great way to learn Windows Azure and what it 
provides. You can attend the event by watching it streamed LIVE online.  
Learn more at http://p.sf.net/sfu/ms-windowsazure
_______________________________________________
Languagetool-cvs mailing list
Languagetool-cvs@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs

Reply via email to