Revision: 7538 http://languagetool.svn.sourceforge.net/languagetool/?rev=7538&view=rev Author: jaumeortola Date: 2012-06-27 22:00:13 +0000 (Wed, 27 Jun 2012) Log Message: ----------- [ca] Fixed some false alarms. One new pattern rule: EN_LA_QUE. Test if the speller uses the correct dictionary.
Modified Paths: -------------- trunk/JLanguageTool/CHANGES.txt trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java Modified: trunk/JLanguageTool/CHANGES.txt =================================================================== --- trunk/JLanguageTool/CHANGES.txt 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/CHANGES.txt 2012-06-27 22:00:13 UTC (rev 7538) @@ -30,7 +30,7 @@ -new synthesizer (given a part-of-speech, this generates the inflected word forms) (Jaume Ortolà i Font) -added spellcheck dictionary for the standalone version - using Hunspell dictionary ca-valencia (avl) 2.3.0 by softcatala + using Hunspell dictionary ca-valencia (avl) 2.3.0 by Softcatalà -Russian: -fixed a few false alarms Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml =================================================================== --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27 22:00:13 UTC (rev 7538) @@ -4468,7 +4468,7 @@ <token postag="V.[MSI].*|_GV_" postag_regexp="yes" negate_pos="yes"><exception postag="V.[MSI].*|_GV_" postag_regexp="yes"/></token> <marker> <and> - <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes" /></token> + <token postag="NC.*" postag_regexp="yes"><exception postag="_GN_.*" postag_regexp="yes" /><exception>coma</exception></token> <token postag="V.[MSI].*" postag_regexp="yes"><exception postag="_GV_" /><exception regexp="yes">\p{Lu}+[\p{Ll}·]*</exception><exception regexp="yes">[\p{Ll}·]+(e|[aei]sses|[ae]res|era)</exception></token> <!-- problema: els noms acabats en -e no tenen comprovació de concordança!! --> </and> Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml =================================================================== --- trunk/JLanguageTool/src/rules/ca/grammar.xml 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml 2012-06-27 22:00:13 UTC (rev 7538) @@ -2442,7 +2442,7 @@ <example type="incorrect">La possibilitat <marker>de que</marker> ho facis</example> <example type="correct">La possibilitat <marker>que</marker> ho facis</example> </rule> - <rule id="des_de" name="des de/que"> + <rule id="DES_DE" name="des de/que"> <pattern> <marker> <token>des</token> @@ -2518,6 +2518,17 @@ <example type="incorrect"><marker>Des de que</marker> m'ho vas dir.</example> <example type="correct"><marker>Des que</marker> m'ho vas dir.</example> </rule> + <rule id="EN_LA_QUE" name="*en la què"> + <pattern> + <token postag="SPS00"/> + <token postag="DA.*" postag_regexp="yes"/> + <token>què</token> + </pattern> + <message>Cal dir <suggestion><match no="1"/> què</suggestion> o <suggestion><match no="1"/> <match no="2"/> <match no="2" postag="DA..(.)." postag_regexp="yes" postag_replace="PR0C$1000">qual</match></suggestion>.</message> + <short>Expressió incorrecta</short> + <example type="incorrect">El lloc <marker>en el què</marker> el van trobar</example> + <example type="correct">El lloc <marker>en què</marker> el van trobar</example> + </rule> </category> <category name="Repeticions"> <rulegroup id="PHRASE_REPETITION" name="Repetició de dues paraules ('a la a la')"> @@ -2908,7 +2919,8 @@ <example type="incorrect"><marker>Si</marker> que vull.</example> <example type="correct"><marker>Sí</marker> que vull.</example> </rule> - <rule> + <!-- Les regles de concordança fan millor la detecció --> + <!-- <rule> <pattern> <token>son<exception postag="_GN.*" postag_regexp="yes"></exception></token> </pattern> @@ -2916,7 +2928,7 @@ <short>S'accentua si és del verb "ser".</short> <example type="incorrect">Més del que <marker>son</marker>.</example> <example type="correct">Més del que <marker>són</marker>.</example> - </rule> + </rule> --> <rule> <pattern> <token postag="V.*" postag_regexp="yes"></token> Modified: trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java =================================================================== --- trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java 2012-06-27 22:00:13 UTC (rev 7538) @@ -50,6 +50,8 @@ assertEquals(0, rule.match(langTool.getAnalyzedSentence("Porta'n quatre al col·legi.")).length); assertEquals(0, rule.match(langTool.getAnalyzedSentence("Has de portar-me'n moltes.")).length); assertEquals(0, rule.match(langTool.getAnalyzedSentence(",")).length); + // Spellcheck dictionary contains Valencian and general accentuation + assertEquals(0, rule.match(langTool.getAnalyzedSentence("Francès i francés.")).length); //test for "LanguageTool": This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. ------------------------------------------------------------------------------ Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ _______________________________________________ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs