Revision: 7538
http://languagetool.svn.sourceforge.net/languagetool/?rev=7538&view=rev
Author: jaumeortola
Date: 2012-06-27 22:00:13 +0000 (Wed, 27 Jun 2012)
Log Message:
-----------
[ca] Fixed some false alarms. One new pattern rule: EN_LA_QUE. Test if the
speller uses the correct dictionary.
Modified Paths:
--------------
trunk/JLanguageTool/CHANGES.txt
trunk/JLanguageTool/src/resource/ca/disambiguation.xml
trunk/JLanguageTool/src/rules/ca/grammar.xml
trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java
Modified: trunk/JLanguageTool/CHANGES.txt
===================================================================
--- trunk/JLanguageTool/CHANGES.txt 2012-06-27 21:50:50 UTC (rev 7537)
+++ trunk/JLanguageTool/CHANGES.txt 2012-06-27 22:00:13 UTC (rev 7538)
@@ -30,7 +30,7 @@
-new synthesizer (given a part-of-speech, this generates the inflected word
forms) (Jaume Ortolà i Font)
-added spellcheck dictionary for the standalone version
- using Hunspell dictionary ca-valencia (avl) 2.3.0 by softcatala
+ using Hunspell dictionary ca-valencia (avl) 2.3.0 by Softcatalà
-Russian:
-fixed a few false alarms
Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml
===================================================================
--- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27
21:50:50 UTC (rev 7537)
+++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27
22:00:13 UTC (rev 7538)
@@ -4468,7 +4468,7 @@
<token postag="V.[MSI].*|_GV_" postag_regexp="yes"
negate_pos="yes"><exception postag="V.[MSI].*|_GV_"
postag_regexp="yes"/></token>
<marker>
<and>
- <token postag="NC.*" postag_regexp="yes"><exception
postag="_GN_.*" postag_regexp="yes" /></token>
+ <token postag="NC.*" postag_regexp="yes"><exception
postag="_GN_.*" postag_regexp="yes" /><exception>coma</exception></token>
<token postag="V.[MSI].*" postag_regexp="yes"><exception
postag="_GV_" /><exception regexp="yes">\p{Lu}+[\p{Ll}·]*</exception><exception
regexp="yes">[\p{Ll}·]+(e|[aei]sses|[ae]res|era)</exception></token>
<!-- problema: els noms acabats en -e no tenen comprovació
de concordança!! -->
</and>
Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml
===================================================================
--- trunk/JLanguageTool/src/rules/ca/grammar.xml 2012-06-27 21:50:50 UTC
(rev 7537)
+++ trunk/JLanguageTool/src/rules/ca/grammar.xml 2012-06-27 22:00:13 UTC
(rev 7538)
@@ -2442,7 +2442,7 @@
<example type="incorrect">La possibilitat <marker>de que</marker>
ho facis</example>
<example type="correct">La possibilitat <marker>que</marker> ho
facis</example>
</rule>
- <rule id="des_de" name="des de/que">
+ <rule id="DES_DE" name="des de/que">
<pattern>
<marker>
<token>des</token>
@@ -2518,6 +2518,17 @@
<example type="incorrect"><marker>Des de que</marker> m'ho vas
dir.</example>
<example type="correct"><marker>Des que</marker> m'ho vas
dir.</example>
</rule>
+ <rule id="EN_LA_QUE" name="*en la què">
+ <pattern>
+ <token postag="SPS00"/>
+ <token postag="DA.*" postag_regexp="yes"/>
+ <token>què</token>
+ </pattern>
+ <message>Cal dir <suggestion><match no="1"/> què</suggestion> o
<suggestion><match no="1"/> <match no="2"/> <match no="2" postag="DA..(.)."
postag_regexp="yes"
postag_replace="PR0C$1000">qual</match></suggestion>.</message>
+ <short>Expressió incorrecta</short>
+ <example type="incorrect">El lloc <marker>en el què</marker> el
van trobar</example>
+ <example type="correct">El lloc <marker>en què</marker> el van
trobar</example>
+ </rule>
</category>
<category name="Repeticions">
<rulegroup id="PHRASE_REPETITION" name="Repetició de dues paraules ('a
la a la')">
@@ -2908,7 +2919,8 @@
<example type="incorrect"><marker>Si</marker> que
vull.</example>
<example type="correct"><marker>Sí</marker> que vull.</example>
</rule>
- <rule>
+ <!-- Les regles de concordança fan millor la detecció -->
+ <!-- <rule>
<pattern>
<token>son<exception postag="_GN.*"
postag_regexp="yes"></exception></token>
</pattern>
@@ -2916,7 +2928,7 @@
<short>S'accentua si és del verb "ser".</short>
<example type="incorrect">Més del que
<marker>son</marker>.</example>
<example type="correct">Més del que
<marker>són</marker>.</example>
- </rule>
+ </rule> -->
<rule>
<pattern>
<token postag="V.*" postag_regexp="yes"></token>
Modified:
trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java
===================================================================
---
trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java
2012-06-27 21:50:50 UTC (rev 7537)
+++
trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java
2012-06-27 22:00:13 UTC (rev 7538)
@@ -50,6 +50,8 @@
assertEquals(0, rule.match(langTool.getAnalyzedSentence("Porta'n
quatre al col·legi.")).length);
assertEquals(0, rule.match(langTool.getAnalyzedSentence("Has de
portar-me'n moltes.")).length);
assertEquals(0, rule.match(langTool.getAnalyzedSentence(",")).length);
+ // Spellcheck dictionary contains Valencian and general accentuation
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence("Francès i
francés.")).length);
//test for "LanguageTool":
This was sent by the SourceForge.net collaborative development platform, the
world's largest Open Source development site.
------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and
threat landscape has changed and how IT managers can respond. Discussions
will include endpoint security, mobile security and the latest in malware
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs