Revision: 6506 http://languagetool.svn.sourceforge.net/languagetool/?rev=6506&view=rev Author: dominikoeo Date: 2012-02-11 20:35:22 +0000 (Sat, 11 Feb 2012) Log Message: ----------- [br] detect errors in: - *An dra kenta?\195?\177* -> "An dra genta?\195?\177" - *Lakaet e vrezhoneg* -> "Lakaet e brezhoneg"
Modified Paths: -------------- trunk/JLanguageTool/src/resource/br/disambiguation.xml trunk/JLanguageTool/src/rules/br/grammar.xml Modified: trunk/JLanguageTool/src/resource/br/disambiguation.xml =================================================================== --- trunk/JLanguageTool/src/resource/br/disambiguation.xml 2012-02-11 19:23:13 UTC (rev 6505) +++ trunk/JLanguageTool/src/resource/br/disambiguation.xml 2012-02-11 20:35:22 UTC (rev 6506) @@ -166,6 +166,16 @@ <disambig action="remove"><wd lemma="e" pos="L e"/></disambig> </rule> </rulegroup> + <rulegroup id="E_P" name="e preposition"> + <rule> + <pattern mark="1"> + <token inflected="yes" regexp="yes">trein|lakaat|skrivañ</token> + <token postag="P">e</token> + <token postag_regexp="yes" postag="N.*" regexp="yes">.*eg</token> + </pattern> + <disambig postag="P"/> + </rule> + </rulegroup> <rulegroup id="NE_V" name="ne + verb"> <rule> <pattern mark="1"> @@ -175,4 +185,20 @@ <disambig><match no="1" postag_regexp="yes" postag="V.*"/></disambig> </rule> </rulegroup> + <rulegroup id="UR_N" name="ur + anv"> + <rule> + <pattern mark="1"> + <token>ur<exception scope="previous">en</exception></token> + <token postag="V.*" postag_regexp="yes"/> + </pattern> + <disambig action="filter" postag="N.*"/> + </rule> + <rule> + <pattern mark="1"> + <token regexp="yes">u[ln]|a[nlr]</token> + <token postag="V.*" postag_regexp="yes"/> + </pattern> + <disambig action="filter" postag="N.*"/> + </rule> + </rulegroup> </rules> Modified: trunk/JLanguageTool/src/rules/br/grammar.xml =================================================================== --- trunk/JLanguageTool/src/rules/br/grammar.xml 2012-02-11 19:23:13 UTC (rev 6505) +++ trunk/JLanguageTool/src/rules/br/grammar.xml 2012-02-11 20:35:22 UTC (rev 6506) @@ -1680,10 +1680,10 @@ <rulegroup id="KEMM_N_J" name="Kemmadur en anv-gwan o tont warlec’h an anv"> <rule> <pattern mark_from="1" mark_to="-1"> - <token regexp="yes">aer|amzer|avel|brud|c’hoari|c’hwezh|lann|lur|revr|tra</token> + <token regexp="yes">aer|amzer|avel|brud|c’hoari|c’hwezh|lann|lur|revr|[dt]ra</token> <token postag="J.*" postag_regexp="yes" inflected="yes" regexp="yes">[ktpgbm].* <exception postag="J[^M]*M.*:1:.*" postag_regexp="yes"/> - <exception postag="[^J].*" postag_regexp="yes"/> + <exception postag="J.*|K e sp o" postag_regexp="yes" negate_pos="yes"/> </token> <token negate="yes">ha</token> </pattern> @@ -1693,15 +1693,17 @@ <example type="correct">An avel <marker>greñv</marker>.</example> <example type="correct">Ur skol <marker>divyezhek</marker>.</example> <example type="correct">Ur skol <marker>zivyezhek</marker>.</example> + <example type="incorrect">An dra <marker>kentañ</marker>.</example> + <example type="correct">An dra <marker>gentañ</marker>.</example> </rule> <rule> <pattern mark_from="1" mark_to="-1"> <token postag="N f s.*|N m p t.*" postag_regexp="yes"> - <exception postag="N f p.*|N m s.*|N m p|N m p [^t].*" postag_regexp="yes"/> + <exception postag="N f p.*|N m s.*|N m p|N m p [^t].*|V.*" postag_regexp="yes"/> </token> <token postag="J.*" postag_regexp="yes" inflected="yes" regexp="yes">[gbm].* <exception postag="J[^M]*M.*:1:.*" postag_regexp="yes"/> - <exception postag="[^J].*" postag_regexp="yes"/> + <exception postag="J.*" postag_regexp="yes" negate_pos="yes"/> <!-- bennak is marked as an adjective in the diction, it should be an adverb --> <exception>bennak</exception> @@ -1724,11 +1726,11 @@ <rule> <pattern mark_from="1" mark_to="-1"> <token postag="N f s.*|N m p t.*" postag_regexp="yes" regexp="yes">.*[lmnrvaeiouwy] - <exception postag="N f p.*|N m s.*|N m p|N m p [^t].*" postag_regexp="yes"/> + <exception postag="N f p.*|N m s.*|N m p|N m p [^t].*|V.*" postag_regexp="yes"/> </token> <token postag="J.*" postag_regexp="yes" inflected="yes" regexp="yes">[ktp].* <exception postag="J[^M]*M.*:1:.*" postag_regexp="yes"/> - <exception postag="[^J].*" postag_regexp="yes"/> + <exception postag="J.*|K e sp o" postag_regexp="yes" negate_pos="yes"/> <!-- bennak is marked as an adjective in the diction, it should be an adverb --> <exception>bennak</exception> @@ -1740,6 +1742,8 @@ <example type="correct">Kendirvi binvidik.</example> <example type="correct">Tud kozh.</example> <example type="correct">Paotred pinvidik.</example> + <example type="incorrect">An dro <marker>kentañ</marker>.</example> + <example type="correct">An dro gentañ.</example> </rule> <rule> <pattern mark_from="1"> @@ -1749,8 +1753,8 @@ <exception>gwall</exception> </token> <and> - <token postag="J[^M]*M.*:1:.*" postag_regexp="yes"> - <exception negate_pos="yes" postag="SENT_END|[^M]*M.*" postag_regexp="yes"/> + <token postag="J.*" postag_regexp="yes"> + <exception negate_pos="yes" postag="SENT_END|J[^M]*M.*:1:.*" postag_regexp="yes"/> </token> <token regexp="yes">[gdb].*</token> </and> @@ -1777,10 +1781,10 @@ <exception regexp="yes" inflected="yes">.|re|aer|avel|brud|c’hoari|c’hwezh|gwall|lur|revr|seul|tra|war</exception> </token> <token postag="J[^M]*M:.*" postag_regexp="yes"> - <exception negate_pos="yes" postag="J[^M]*M:.*|SENT_END" postag_regexp="yes"/> + <exception negate_pos="yes" postag="J[^M]*M.*:1:.*|SENT_END" postag_regexp="yes"/> </token> </pattern> - <message>Ne zlefe bezañ ur c’hemmadur en anv-gwan «\2» goude an anv benel unan pe gourel lies «\1».</message> + <message>Ne zlefe bezañ ur c’hemmadur en anv-gwan «\2» goude an anv gourel unan pe benel lies «\1».</message> <example type="incorrect">Plac’hed <marker>vras</marker></example> <example type="incorrect">Plac’hed <marker>vras</marker>.</example> <example type="correct">Ur plac’h vras</example> @@ -1891,6 +1895,16 @@ <example type="correct">Ur c’hozh wetur.</example> </rule> </rulegroup> + <rule id="P_E" name="kemmadur ebet gant an araogenn «e»"> + <pattern mark_from="1"> + <token postag="P">e<exception negate_pos="yes" postag="P"/></token> + <token postag="N [^M]*M:.*" postag_regexp="yes"><exception postag="N [^M]*" postag_regexp="yes"/></token> + </pattern> + <message>Ne zlefe ket bezañ ur c’hemmadur goude an araogenn «e».</message> + <example type="incorrect">Lakaet e <marker>vrezhoneg</marker>.</example> + <example type="correct">Lakaet e brezhoneg.</example> + <example type="correct">Lenn a ra evit gwellaat e vrezhoneg.</example> + </rule> </category> <category name="Ger-mell"> This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. ------------------------------------------------------------------------------ Virtualization & Cloud Management Using Capacity Planning Cloud computing makes use of virtualization - but cloud computing also focuses on allowing computing to be delivered as a service. http://www.accelacomm.com/jaw/sfnl/114/51521223/ _______________________________________________ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs