[LanguageTool] SF.net SVN: languagetool:[7350] trunk/JLanguageTool/src/java/org/ languagetool/language/Catalan.java
Revision: 7350 http://languagetool.svn.sourceforge.net/languagetool/?rev=7350view=rev Author: jaumeortola Date: 2012-06-15 10:04:24 + (Fri, 15 Jun 2012) Log Message: --- Jaume Ortola, new Catalan mantainer. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/language/Catalan.java Modified: trunk/JLanguageTool/src/java/org/languagetool/language/Catalan.java === --- trunk/JLanguageTool/src/java/org/languagetool/language/Catalan.java 2012-06-15 09:55:22 UTC (rev 7349) +++ trunk/JLanguageTool/src/java/org/languagetool/language/Catalan.java 2012-06-15 10:04:24 UTC (rev 7350) @@ -83,7 +83,7 @@ @Override public Contributor[] getMaintainers() { -return new Contributor[] {new Contributor(Ricard Roca)}; +return new Contributor[] {new Contributor(Ricard Roca), new Contributor(Jaume Ortolà) }; } @Override This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7434] trunk/JLanguageTool/src/java/org/ languagetool/rules/ca/CatalanUnpairedQuestionMarksRule.java
Revision: 7434 http://languagetool.svn.sourceforge.net/languagetool/?rev=7434view=rev Author: jaumeortola Date: 2012-06-20 20:38:19 + (Wed, 20 Jun 2012) Log Message: --- [ca] CatalanUpairedQuestionMarksRule.java set off by default. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/CatalanUnpairedQuestionMarksRule.java Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/CatalanUnpairedQuestionMarksRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/CatalanUnpairedQuestionMarksRule.java 2012-06-20 20:01:50 UTC (rev 7433) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/CatalanUnpairedQuestionMarksRule.java 2012-06-20 20:38:19 UTC (rev 7434) @@ -32,6 +32,7 @@ public CatalanUnpairedQuestionMarksRule(final ResourceBundle messages, final Language language) { super(messages, language); +setDefaultOff(); startSymbols = CA_START_SYMBOLS; endSymbols = CA_END_SYMBOLS; uniqueMapInit(); This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7435] trunk/JLanguageTool/src
Revision: 7435 http://languagetool.svn.sourceforge.net/languagetool/?rev=7435view=rev Author: jaumeortola Date: 2012-06-20 21:16:19 + (Wed, 20 Jun 2012) Log Message: --- [ca] Fix some false alarms in PHRASE_REPETITION Modified Paths: -- trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-20 20:38:19 UTC (rev 7434) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-20 21:16:19 UTC (rev 7435) @@ -31,8 +31,7 @@ /marker token regexp=yesde|del|dels|d'/token /pattern -disambig action=addwd lemma=enmig de pos=lt;LOC_PREPgt;/wd -/disambig +disambig action=addwd lemma=enmig de pos=lt;LOC_PREPgt;/wd/disambig /rule rule id=enmig2 name=locució prep pattern @@ -4699,4 +4698,28 @@ disambig action=filter postag=[^_].*/disambig /rule -- +!-- Útils per a algunes regles -- +rulegroup id=diferent_del_del name=diferent del del +rule +pattern +token regexp=yesdiferents?/token +marker +tokende/token +/marker +token postag=DA.* postag_regexp=yes/ +/pattern +disambig action=addwd pos=allow_repetition/wd/disambig +/rule +rule +pattern +tokena/token +tokendiferència/token +marker +tokende/token +/marker +token postag=DA.* postag_regexp=yes/ +/pattern +disambig action=addwd pos=allow_repetition/wd/disambig +/rule +/rulegroup /rules \ No newline at end of file Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-20 20:38:19 UTC (rev 7434) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-20 21:16:19 UTC (rev 7435) @@ -2825,19 +2825,20 @@ !-- made more general-- rule pattern -token negate_pos=yes postag=SENT_START regexp=yesexceptioni/exception\p{L}+/token -token regexp=yesexceptioni/exception\p{L}+/token -token -match no=0/matchexception postag=lt;/LOC_ADVgt; regexp=yespoc|més/exception/token -token -match no=1/matchexception postag=lt;/LOC_ADVgt; regexp=yespoc|més/exception/token +token negate_pos=yes postag=SENT_START regexp=yesexceptioni/exceptionexception postag=allow_repetitionde/exception[\p{L}·'-]+/token +token regexp=yesexceptioni/exception[\p{L}·'-]+/token +marker +tokenmatch no=0/matchexception postag=lt;/LOC_ADVgt; regexp=yespoc|més/exception/token +tokenmatch no=1/matchexception postag=lt;/LOC_ADVgt; regexp=yespoc|més/exception/token +/marker /pattern -messageAquesta frase és duplicada. Probablement hauria de ser suggestion\1 \2/suggestion./message +messageElimina la duplicació. suggestion/suggestion/message shortFrase duplicada/short -example correction=a casa type=incorrectBenvinguts markera casa a casa/marker meva./example -example type=correctBenviguts markera casa/marker meva./example +example correction= type=incorrectBenvinguts a casa markera casa/marker meva./example +example correction= type=incorrectÉs l'americà markerl'americà/marker./example example type=correctNo volia res més que mirar i mirar i mirar./example example type=correctA més a més, ho va fer a poc a poc./example +example type=correctA diferència dels dels ocells./example /rule /rulegroup rulegroup id=substantius_junts name=Dos noms comuns junts This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7449] trunk/JLanguageTool/src/java/org/ languagetool/gui/Tools.java
Revision: 7449 http://languagetool.svn.sourceforge.net/languagetool/?rev=7449view=rev Author: jaumeortola Date: 2012-06-21 21:42:31 + (Thu, 21 Jun 2012) Log Message: --- Escape single quote in i18n messages. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/gui/Tools.java Modified: trunk/JLanguageTool/src/java/org/languagetool/gui/Tools.java === --- trunk/JLanguageTool/src/java/org/languagetool/gui/Tools.java 2012-06-21 20:44:04 UTC (rev 7448) +++ trunk/JLanguageTool/src/java/org/languagetool/gui/Tools.java 2012-06-21 21:42:31 UTC (rev 7449) @@ -43,7 +43,7 @@ public static String makeTexti18n(final ResourceBundle messages, final String key, final Object[] messageArguments) { final MessageFormat formatter = new MessageFormat(); -formatter.applyPattern(messages.getString(key)); +formatter.applyPattern(messages.getString(key).replaceAll(', '')); return formatter.format(messageArguments); } This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7462] trunk/JLanguageTool/src
Revision: 7462 http://languagetool.svn.sourceforge.net/languagetool/?rev=7462view=rev Author: jaumeortola Date: 2012-06-22 16:14:30 + (Fri, 22 Jun 2012) Log Message: --- [ca] Minor change in ComplexAdjectiveConcordanceRule.java Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java trunk/JLanguageTool/src/rules/ca/grammar.xml trunk/JLanguageTool/src/test/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRuleTest.java Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java 2012-06-22 15:46:38 UTC (rev 7461) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java 2012-06-22 16:14:30 UTC (rev 7462) @@ -74,7 +74,7 @@ private static final Pattern UPPERCASE = Pattern.compile(\\p{Lu}[\\p{Ll}\u00B7]*); private static final Pattern COORDINACIO = Pattern.compile(,|i|o); private static final Pattern COORDINACIO_IONI = Pattern.compile(i|o|ni); - private static final Pattern KEEP_COUNT = Pattern.compile(AQ.*|N.*|D[AID].*|SPS.*|R.*); + private static final Pattern KEEP_COUNT = Pattern.compile(AQ.*|N.*|D[AID].*|SPS.*|R.*|V.P.*); private static final Pattern KEEP_COUNT2 = Pattern.compile(,|i|o|ni); private static final Pattern PREPOSICIONS = Pattern.compile(SPS.*); private static final Pattern VERB_AUXILIAR = Pattern.compile(V[AS].*); Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-22 15:46:38 UTC (rev 7461) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-22 16:14:30 UTC (rev 7462) @@ -275,7 +275,7 @@ example type=incorrectAixò markervermells/marker./example example type=correctAixò vermell./example /rule -rulegroup id=DET_POS_NOM name=concordança det+pos+nom +rulegroup id=CONCORDANCES_DET_POS_NOM name=concordances determinant + possessiu + nom rule pattern unify negate=yes Modified: trunk/JLanguageTool/src/test/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRuleTest.java === --- trunk/JLanguageTool/src/test/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRuleTest.java 2012-06-22 15:46:38 UTC (rev 7461) +++ trunk/JLanguageTool/src/test/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRuleTest.java 2012-06-22 16:14:30 UTC (rev 7462) @@ -42,6 +42,7 @@ public void testRule() throws IOException { // correct sentences: + assertCorrect(instruments de càlcul basats en boles anomenats yupana.); assertCorrect(El rei ha trobat l'excusa i l'explicació adequades.); assertCorrect(El rei ha trobat l'excusa i l'explicació adequada.); assertCorrect(Copa del món femenina.); @@ -61,7 +62,7 @@ assertCorrect(Els períodes clàssic i medieval.); assertCorrect(Els costats superior i laterals.); assertCorrect(En una molècula de glucosa i una de fructosa unides.); - // Sholud be Incorrect, but it is impossible to detect + // Should be Incorrect, but it is impossible to detect assertCorrect(Índex de desenvolupament humà i qualitat de vida elevat); assertCorrect(Índex de desenvolupament humà i qualitat de vida elevats); assertCorrect(Índex de desenvolupament humà i qualitat de vida elevada); @@ -78,7 +79,7 @@ assertIncorrect(En una molècula de glucosa i una de fructosa units.); assertIncorrect(Un punt de densitat i gravetat infinits.); assertIncorrect(Índex de desenvolupament humà i qualitat de vida elevades.); - // Sholud be Incorrect, but it is impossible to detect + // Should be Incorrect, but it is impossible to detect // assertIncorrect(Índex de desenvolupament humà i qualitat de vida elevat); assertIncorrect(La massa, el radi i la lluminositat llistat per ell.); assertIncorrect(La massa, el radi i la lluminositat llistades per ell.); This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include
[LanguageTool] SF.net SVN: languagetool:[7509] trunk/JLanguageTool/src
Revision: 7509 http://languagetool.svn.sourceforge.net/languagetool/?rev=7509view=rev Author: jaumeortola Date: 2012-06-25 22:57:20 + (Mon, 25 Jun 2012) Log Message: --- [ca] Fixed some false alarms. Modified Paths: -- trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-25 22:29:21 UTC (rev 7508) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-25 22:57:20 UTC (rev 7509) @@ -29,7 +29,7 @@ marker token regexp=yesenmig|entorn/token /marker -token regexp=yesde|del|dels|d'/token +token inflected=yesde/token /pattern disambig action=addwd lemma=enmig de pos=lt;LOC_PREPgt;/wd/disambig /rule @@ -37,7 +37,7 @@ pattern token regexp=yesenmig|entorn/token marker -token regexp=yesde|del|dels|d'/token +token inflected=yesde/token /marker /pattern disambig action=addwd lemma=enmig de pos=lt;/LOC_PREPgt;/wd @@ -698,8 +698,20 @@ /pattern disambig action=filter postag=lt;LOC_PREPgt; / /rule - rule +rule !-- cal controlar les excepcions -- pattern +token negate=yesque/token +marker +and +token postag=N.* postag_regexp=yesrespecte/token +token postag=V.* postag_regexp=yes/token +/and +/marker +/pattern +disambig action=filter postag=N.* / +/rule +rule +pattern token postag=V.[IS].* postag_regexp=yes/token marker and @@ -850,7 +862,7 @@ pattern token postag=N.* postag_regexp=yesexception postag=[NA].* postag_regexp=yes negate_pos=yes //token marker -token regexp=yespropietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|model/token +token regexp=yespropietat|consort|mare|web|alfa|beta|gamma|lambda|font|hivernacle|euro|tipus|clau|membre|núm|número|matriu|estàndard|estrella|model|base/token /marker /pattern disambig action=filter postag=AQ0CN0 / @@ -1087,6 +1099,27 @@ /pattern disambig action=addwd pos=_GV_/wd/disambig /rule +!-- haver + estat + participi -- +rule +pattern +token inflected=yeshaver/token +token postag=V.P.* postag_regexp=yes inflected=yesser/token +marker +token postag=V.P.* postag_regexp=yes/token +/marker +/pattern +disambig action=filter postag=V.P.*/disambig +/rule +rule +pattern +token inflected=yeshaver/token +token postag=V.P.* postag_regexp=yes inflected=yesser/token +marker +token postag=V.P.* postag_regexp=yes/token +/marker +/pattern +disambig action=addwd pos=_GV_/wd/disambig +/rule /rulegroup rulegroup id=haver_hi_auxiliar name=haver-hi auxiliar rule @@ -1841,9 +1874,22 @@ disambig action=filter postag=[^V].*/disambig !-- les dues meitats dreta i esquerra (A+N+V)-- /rule +rule id=verb_nom_sentstart2 name=verb i nom a principi de frase +pattern +token regexp=yes,|;/token +marker +and +token postag=V.[IS].* postag_regexp=yes/token +token postag=NC.* postag_regexp=yes/token +/and +/marker +token inflected=yes regexp=yesde|entre/token +/pattern +disambig action=filter postag=[^V].*/disambig +/rule rule id=verb_nomverb0 name=verb + verb/no_verb pattern -token postag=V.[MIS].* postag_regexp=yesexception postag=V.[MIS].* postag_regexp=yes negate_pos=yes//token +token postag=V.[NMIS].* postag_regexp=yesexception postag=V.[NMIS].*|complement postag_regexp=yes negate_pos=yes//token marker and token postag=V.[IS].* postag_regexp=yesexception postag=DI.* postag_regexp=yes//token !-- no té cap quantitat -- @@ -3321,7 +3367,7 @@ disambig action=filter postag=V.[^MNPG].*/disambig /rule /rulegroup -rule id=noVerb2
[LanguageTool] SF.net SVN: languagetool:[7531] trunk/JLanguageTool
Revision: 7531 http://languagetool.svn.sourceforge.net/languagetool/?rev=7531view=rev Author: jaumeortola Date: 2012-06-27 19:21:00 + (Wed, 27 Jun 2012) Log Message: --- [ca] Added source of spellcheck dictionary Modified Paths: -- trunk/JLanguageTool/CHANGES.txt trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/CHANGES.txt === --- trunk/JLanguageTool/CHANGES.txt 2012-06-27 18:30:34 UTC (rev 7530) +++ trunk/JLanguageTool/CHANGES.txt 2012-06-27 19:21:00 UTC (rev 7531) @@ -30,6 +30,7 @@ -new synthesizer (given a part-of-speech, this generates the inflected word forms) (Jaume Ortolà i Font) -added spellcheck dictionary for the standalone version +using Hunspell dictionary ca-valencia (avl) 2.3.0 by softcatala -Russian: -fixed a few false alarms Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-27 18:30:34 UTC (rev 7530) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-27 19:21:00 UTC (rev 7531) @@ -659,7 +659,7 @@ /unify /marker !-- excloure totes les expressions temporals. Falta: els darrers vint anys, els caps de setmana... la major part, la majoria -- -token regexp=yes negate=yes\d+exception inflected=yes regexp=yesvegada|volta|cop|any|dia|mes|segle|setmana|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre/exception/token +token regexp=yes negate=yes[\d-]+exception inflected=yes regexp=yesvegada|volta|cop|any|dia|mes|segle|setmana|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre/exception/token tokenexception inflected=yes regexp=yesvegada|volta|cop|any|dia|mes|segle|setmana|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre/exception/token !-- excepcions: una altra vegada, els caps de setmana... -- tokenexception inflected=yes regexp=yesvegada|volta|cop|any|dia|mes|segle|setmana|gener|febrer|març|abril|maig|juny|juliol|agost|setembre|octubre|novembre|desembre/exception/token tokenexception inflected=yes regexp=yesvegada|volta|cop|any|dia|mes|segle|setmana/exception/token @@ -680,8 +680,6 @@ token postag=D[DAI].* postag_regexp=yesexception postag=RG|_GV_ postag_regexp=yes/exception regexp=yes\p{Lu}[\p{Ll}·]*/exception/token /unify /marker - -token regexp=yes negate=yes\d+/token /pattern messageError de concordança./message shortError de concordança./short This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7538] trunk/JLanguageTool
Revision: 7538 http://languagetool.svn.sourceforge.net/languagetool/?rev=7538view=rev Author: jaumeortola Date: 2012-06-27 22:00:13 + (Wed, 27 Jun 2012) Log Message: --- [ca] Fixed some false alarms. One new pattern rule: EN_LA_QUE. Test if the speller uses the correct dictionary. Modified Paths: -- trunk/JLanguageTool/CHANGES.txt trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java Modified: trunk/JLanguageTool/CHANGES.txt === --- trunk/JLanguageTool/CHANGES.txt 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/CHANGES.txt 2012-06-27 22:00:13 UTC (rev 7538) @@ -30,7 +30,7 @@ -new synthesizer (given a part-of-speech, this generates the inflected word forms) (Jaume Ortolà i Font) -added spellcheck dictionary for the standalone version -using Hunspell dictionary ca-valencia (avl) 2.3.0 by softcatala +using Hunspell dictionary ca-valencia (avl) 2.3.0 by Softcatalà -Russian: -fixed a few false alarms Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-27 22:00:13 UTC (rev 7538) @@ -4468,7 +4468,7 @@ token postag=V.[MSI].*|_GV_ postag_regexp=yes negate_pos=yesexception postag=V.[MSI].*|_GV_ postag_regexp=yes//token marker and -token postag=NC.* postag_regexp=yesexception postag=_GN_.* postag_regexp=yes //token +token postag=NC.* postag_regexp=yesexception postag=_GN_.* postag_regexp=yes /exceptioncoma/exception/token token postag=V.[MSI].* postag_regexp=yesexception postag=_GV_ /exception regexp=yes\p{Lu}+[\p{Ll}·]*/exceptionexception regexp=yes[\p{Ll}·]+(e|[aei]sses|[ae]res|era)/exception/token !-- problema: els noms acabats en -e no tenen comprovació de concordança!! -- /and Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-27 21:50:50 UTC (rev 7537) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-06-27 22:00:13 UTC (rev 7538) @@ -2442,7 +2442,7 @@ example type=incorrectLa possibilitat markerde que/marker ho facis/example example type=correctLa possibilitat markerque/marker ho facis/example /rule -rule id=des_de name=des de/que +rule id=DES_DE name=des de/que pattern marker tokendes/token @@ -2518,6 +2518,17 @@ example type=incorrectmarkerDes de que/marker m'ho vas dir./example example type=correctmarkerDes que/marker m'ho vas dir./example /rule +rule id=EN_LA_QUE name=*en la què +pattern +token postag=SPS00/ +token postag=DA.* postag_regexp=yes/ +tokenquè/token +/pattern +messageCal dir suggestionmatch no=1/ què/suggestion o suggestionmatch no=1/ match no=2/ match no=2 postag=DA..(.). postag_regexp=yes postag_replace=PR0C$1000qual/match/suggestion./message +shortExpressió incorrecta/short +example type=incorrectEl lloc markeren el què/marker el van trobar/example +example type=correctEl lloc markeren què/marker el van trobar/example +/rule /category category name=Repeticions rulegroup id=PHRASE_REPETITION name=Repetició de dues paraules ('a la a la') @@ -2908,7 +2919,8 @@ example type=incorrectmarkerSi/marker que vull./example example type=correctmarkerSí/marker que vull./example /rule -rule +!-- Les regles de concordança fan millor la detecció -- +!-- rule pattern tokensonexception postag=_GN.* postag_regexp=yes/exception/token /pattern @@ -2916,7 +2928,7 @@ shortS'accentua si és del verb ser./short example type=incorrectMés del que markerson/marker./example example type=correctMés del que markersón/marker./example -/rule +/rule -- rule pattern token postag=V.* postag_regexp=yes/token Modified: trunk/JLanguageTool/src/test/org/languagetool/rules/ca/MorfologikCatalanSpellerRuleTest.java === --- trunk/JLanguageTool/src/test/org
[LanguageTool] SF.net SVN: languagetool:[7542] trunk/JLanguageTool/src/resource/ca
Revision: 7542 http://languagetool.svn.sourceforge.net/languagetool/?rev=7542view=rev Author: jaumeortola Date: 2012-06-28 16:13:49 + (Thu, 28 Jun 2012) Log Message: --- [ca] Words added to the tagger dictionary: adverbs -ment, toponyms. Modified Paths: -- trunk/JLanguageTool/src/resource/ca/catalan.dict trunk/JLanguageTool/src/resource/ca/catalan_synth.dict trunk/JLanguageTool/src/resource/ca/disambiguation.xml Modified: trunk/JLanguageTool/src/resource/ca/catalan.dict === (Binary files differ) Modified: trunk/JLanguageTool/src/resource/ca/catalan_synth.dict === (Binary files differ) Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-28 14:57:48 UTC (rev 7541) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-06-28 16:13:49 UTC (rev 7542) @@ -519,7 +519,7 @@ /rule /rulegroup !--crea etiquetes per als adverbis acabats en -ment-- -rulegroup id=adverbis_ment name=marca adverbis acabats en ment +!-- rulegroup id=adverbis_ment name=marca adverbis acabats en ment rule pattern marker @@ -538,7 +538,7 @@ disambig action=addwd pos=RG/wd /disambig /rule -/rulegroup +/rulegroup -- rulegroup id=interjeccions name=interjeccions rule pattern This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7655] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7655 http://languagetool.svn.sourceforge.net/languagetool/?rev=7655view=rev Author: jaumeortola Date: 2012-07-06 21:25:22 + (Fri, 06 Jul 2012) Log Message: --- [ca] new rule STATU_QUO. Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-06 18:15:41 UTC (rev 7654) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-06 21:25:22 UTC (rev 7655) @@ -4329,7 +4329,7 @@ rulegroup id=EVITA_ACCENTUACIO_NO_VALENCIANA name=Evita l'accentuació general no valenciana (cafè, sotmès, conèixer) rule pattern -token regexp=yes.+è|.+ès|.+ènexception regexp=yesperquè|què|Novetlè/exception/token +token regexp=yes.+è|.+ès|.+ènexception regexp=yesperquès?|quès?|Novetlè/exception/token /pattern messageAccentuació no valenciana. Substituïu per: suggestionmatch no=1 regexp_match=^(.+)è(s|n)? regexp_replace=$1é$2/match/suggestion/message shortAccentuació no valenciana./short @@ -6366,7 +6366,7 @@ /example /rule /rulegroup -rule id=DONAR_A_LABAST name=donar l'abast +rule id=DONAR_LABAST name=*donar a l'abast/donar l'abast pattern token inflected=yesdonar/token tokena/token @@ -6378,6 +6378,16 @@ example type=incorrectNo markerdono a l'abast/marker/example example type=correctNo markerdono l'abast/marker/example /rule +rule id=STATU_QUO name=statu/*estatus quo +pattern +tokenestatus/token +tokenquo/token +/pattern +messageCal dir suggestionstatu quo/suggestion./message +shortExpressió incorrecta/short +example type=incorrectmarkerestatus quo/marker/example +example type=correctstatu quo/example +/rule /category !-- category name=Sintaxi rulegroup id=ordre_dubtos name=ordres de frase dubtosos This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7690] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7690 http://languagetool.svn.sourceforge.net/languagetool/?rev=7690view=rev Author: jaumeortola Date: 2012-07-10 21:09:35 + (Tue, 10 Jul 2012) Log Message: --- [ca] New rule: SI_QUE Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-10 20:24:33 UTC (rev 7689) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-10 21:09:35 UTC (rev 7690) @@ -1968,6 +1968,19 @@ example type=correctmarkerúnicament/marker i exclusivament/example /rule /rulegroup +rule id=SI_QUE name=*sí m'agrada/sí que m'agrada +pattern +marker +token skip=3síexception postag=_GN_MS/exception postag=PP.*|P0.*|V.*|_GV_|SENT_END scope=next postag_regexp=yes negate_pos=yes//token +/marker +token postag=V.[MIS].* postag_regexp=yes/ +/pattern +messageCal dir: suggestionsí que/suggestion./message +example type=incorrectTu markersí/marker hauries respost bé./example +example type=incorrectTu markersí/marker li hauries respost bé./example +example type=correctTu sí que hauries respost bé./example +example type=correctEl sí va acompanyat de dubtes./example +/rule /category category name=Preposicions rulegroup id=MALGRAT name=malgrat (que) This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7693] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7693 http://languagetool.svn.sourceforge.net/languagetool/?rev=7693view=rev Author: jaumeortola Date: 2012-07-11 14:08:11 + (Wed, 11 Jul 2012) Log Message: --- [ca] New rule: ALGUN_QUE_ALTRE. Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-11 10:56:40 UTC (rev 7692) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-11 14:08:11 UTC (rev 7693) @@ -6535,6 +6535,34 @@ example type=incorrectmarkerestatus quo/marker/example example type=correctstatu quo/example /rule +rulegroup id=ALGUN_QUE_ALTRE name=*algun que altre +rule +pattern +tokenalgun/token +tokenque/token +tokenaltre/token +token postag=NCMS000/ +/pattern +messageExpressió incorrecta: suggestionalguns match no=4 postag=NCMP000//suggestion, + suggestionalgun match no=4/ o altre/suggestion./message +shortExpressió incorrecta/short +example type=incorrectalgun que altre home/example +example type=correctalguns homes/example +/rule +rule +pattern +tokenalguna/token +tokenque/token +tokenaltra/token +token postag=NCFS000/ +/pattern +messageExpressió incorrecta: suggestionalgunes match no=4 postag=NCFP000//suggestion, + suggestionalguna match no=4/ o altra/suggestion./message +shortExpressió incorrecta/short +example type=incorrectalguna que altra dona/example +example type=correctalgunes dones/example +/rule +/rulegroup /category !-- category name=Sintaxi rulegroup id=ordre_dubtos name=ordres de frase dubtosos This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7694] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7694 http://languagetool.svn.sourceforge.net/languagetool/?rev=7694view=rev Author: jaumeortola Date: 2012-07-11 15:33:49 + (Wed, 11 Jul 2012) Log Message: --- [ca] error corrected, new rule ALGUN_QUE_ALTRE. Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-11 14:08:11 UTC (rev 7693) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-11 15:33:49 UTC (rev 7694) @@ -6546,7 +6546,7 @@ messageExpressió incorrecta: suggestionalguns match no=4 postag=NCMP000//suggestion, suggestionalgun match no=4/ o altre/suggestion./message shortExpressió incorrecta/short -example type=incorrectalgun que altre home/example +example type=incorrectmarkeralgun que altre home/marker/example example type=correctalguns homes/example /rule rule @@ -6559,7 +6559,7 @@ messageExpressió incorrecta: suggestionalgunes match no=4 postag=NCFP000//suggestion, suggestionalguna match no=4/ o altra/suggestion./message shortExpressió incorrecta/short -example type=incorrectalguna que altra dona/example +example type=incorrectmarkeralguna que altra dona/marker/example example type=correctalgunes dones/example /rule /rulegroup This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7708] trunk/JLanguageTool/src
Revision: 7708 http://languagetool.svn.sourceforge.net/languagetool/?rev=7708view=rev Author: jaumeortola Date: 2012-07-16 11:08:26 + (Mon, 16 Jul 2012) Log Message: --- [ca] Java rule improved ACCENTUATION_CHECK. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java trunk/JLanguageTool/src/test/org/languagetool/rules/ca/AccentuationCheckRuleTest.java Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-15 13:31:59 UTC (rev 7707) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-16 11:08:26 UTC (rev 7708) @@ -67,10 +67,10 @@ private static final Pattern NOM_FS = Pattern.compile(NC[FC][SN].*); private static final Pattern NOM_MP = Pattern.compile(NC[MC][PN].*); private static final Pattern NOM_FP = Pattern.compile(NC[FC][PN].*); - private static final Pattern ADJECTIU_MS = Pattern.compile(AQ.[MC][SN].*|V.P..SM); - private static final Pattern ADJECTIU_FS = Pattern.compile(AQ.[FC][SN].*|V.P..SF); - private static final Pattern ADJECTIU_MP = Pattern.compile(AQ.[MC][PN].*|V.P..PM); - private static final Pattern ADJECTIU_FP = Pattern.compile(AQ.[FC][PN].*|V.P..PF); + private static final Pattern ADJECTIU_MS = Pattern.compile(AQ.[MC][SN].*|V.P..SM|PX.MS.*); + private static final Pattern ADJECTIU_FS = Pattern.compile(AQ.[FC][SN].*|V.P..SF|PX.FS.*); + private static final Pattern ADJECTIU_MP = Pattern.compile(AQ.[MC][PN].*|V.P..PM|PX.MP.*); + private static final Pattern ADJECTIU_FP = Pattern.compile(AQ.[FC][PN].*|V.P..PF|PX.FP.*); private static final Pattern INFINITIU = Pattern.compile(V.N.*); private static final Pattern VERB_CONJUGAT = Pattern.compile(V.[^NGP].*); private static final Pattern NOT_IN_PREV_TOKEN = Pattern.compile(VA.*|PP.*|P0.*|VSP.*); @@ -188,6 +188,7 @@ //circumstancies extraordinàries else if ( !token.equals(pronuncia) !token.equals(pronuncies) !token.equals(venia) !token.equals(venies) !token.equals(tenia) !token.equals(tenies) !token.equals(continua) !token.equals(continues) + !token.equals(genera) (itokens.length-1) ( (matchPostagRegexp(relevantWords.get(token),NOM_MS) matchPostagRegexp(tokens[i+1],ADJECTIU_MS)) @@ -199,6 +200,17 @@ { replacement = relevantWords.get(token).getToken(); } + //les seves contraries + else if ( + (matchPostagRegexp(relevantWords.get(token),NOM_MS) matchPostagRegexp(tokens[i-1],ADJECTIU_MS)) + || (matchPostagRegexp(relevantWords.get(token),NOM_FS) matchPostagRegexp(tokens[i-1],ADJECTIU_FS) +!token.equals(venia) !token.equals(tenia) !token.equals(continua) !token.equals(genera) ) + || (matchPostagRegexp(relevantWords.get(token),NOM_MP) matchPostagRegexp(tokens[i-1],ADJECTIU_MP)) + || (matchPostagRegexp(relevantWords.get(token),NOM_FP) matchPostagRegexp(tokens[i-1],ADJECTIU_FP)) + ) + { + replacement = relevantWords.get(token).getToken(); + } // les circumstancies que ens envolten else if ( nextToken.equals(que) ( ( mArticleELMS.matches() matchPostagRegexp(relevantWords.get(token),NOM_MS) ) Modified: trunk/JLanguageTool/src/test/org/languagetool/rules/ca/AccentuationCheckRuleTest.java === --- trunk/JLanguageTool/src/test/org/languagetool/rules/ca/AccentuationCheckRuleTest.java 2012-07-15 13:31:59 UTC (rev 7707) +++ trunk/JLanguageTool/src/test/org/languagetool/rules/ca/AccentuationCheckRuleTest.java 2012-07-16 11:08:26 UTC (rev 7708) @@ -43,6 +43,8 @@ public void testRule() throws IOException { // correct sentences: + assertCorrect(El cos genera suficient pressió interna.); + assertCorrect(Les seues contràries.); assertCorrect(Això és una frase de prova.); assertCorrect(Amb renúncies i esforç.); assertCorrect(He vingut per a cantar); @@ -67,6 +69,7 @@ assertCorrect(La magnífica conservació del palau.); // errors: +assertIncorrect(Les seues contraries.); assertIncorrect(Amb renuncies i esforç.); assertIncorrect(La renuncia del president.); assertIncorrect(Són circumstancies d'un altre caire.); This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways
[LanguageTool] SF.net SVN: languagetool:[7760] trunk/JLanguageTool/src
Revision: 7760 http://languagetool.svn.sourceforge.net/languagetool/?rev=7760view=rev Author: jaumeortola Date: 2012-07-27 16:59:12 + (Fri, 27 Jul 2012) Log Message: --- [ca] Java rule improved: AccentuationCheckRule Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java trunk/JLanguageTool/src/resource/ca/catalan.dict trunk/JLanguageTool/src/resource/ca/catalan_synth.dict trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/verb_senseaccent_nom_ambaccent.txt trunk/JLanguageTool/src/test/org/languagetool/rules/ca/AccentuationCheckRuleTest.java Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-27 11:43:33 UTC (rev 7759) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-27 16:59:12 UTC (rev 7760) @@ -58,7 +58,7 @@ private static final Pattern ARTICLE_EL_FS = Pattern.compile(la|l'|La|L'); private static final Pattern ARTICLE_EL_MP = Pattern.compile(els|Els); private static final Pattern ARTICLE_EL_FP = Pattern.compile(les|Les); -// private static final Pattern DETERMINANT = Pattern.compile(D[^R].*); + private static final Pattern DETERMINANT = Pattern.compile(D[^R].*); private static final Pattern DETERMINANT_MS = Pattern.compile(D[^R].[MC][SN].*); private static final Pattern DETERMINANT_FS = Pattern.compile(D[^R].[FC][SN].*); private static final Pattern DETERMINANT_MP = Pattern.compile(D[^R].[MC][PN].*); @@ -72,7 +72,7 @@ private static final Pattern ADJECTIU_MP = Pattern.compile(AQ.[MC][PN].*|V.P..PM|PX.MP.*); private static final Pattern ADJECTIU_FP = Pattern.compile(AQ.[FC][PN].*|V.P..PF|PX.FP.*); private static final Pattern INFINITIU = Pattern.compile(V.N.*); - private static final Pattern VERB_CONJUGAT = Pattern.compile(V.[^NGP].*); + private static final Pattern VERB_CONJUGAT = Pattern.compile(V.[^NGP].*|_GV_); private static final Pattern NOT_IN_PREV_TOKEN = Pattern.compile(VA.*|PP.*|P0.*|VSP.*); private static final Pattern BEFORE_ADJECTIVE_MS = Pattern.compile(SPS00|D[^R].[MC][SN].*|V.[^NGP].*|PX.*); private static final Pattern BEFORE_ADJECTIVE_FS = Pattern.compile(SPS00|D[^R].[FC][SN].*|V.[^NGP].*|PX.*); @@ -146,8 +146,8 @@ // verb without accent - noun with accent if (isRelevantWord) { - //amb renuncies -if (tokens[i-1].hasPosTag(SPS00) !matchPostagRegexp(tokens[i],INFINITIU) ) + //amb renuncies DETERMINANT +if (tokens[i-1].hasPosTag(SPS00) !matchPostagRegexp(tokens[i-1],DETERMINANT) !matchPostagRegexp(tokens[i],INFINITIU) ) { replacement = relevantWords.get(token).getToken(); } @@ -157,13 +157,23 @@ !token.equals(cantar) ) ||(matchPostagRegexp(tokens[i-1],DETERMINANT_MP) matchPostagRegexp(relevantWords.get(token),NOM_MP)) ||(matchPostagRegexp(tokens[i-1],DETERMINANT_FS) matchPostagRegexp(relevantWords.get(token),NOM_FS) - !token.equals(venia) !token.equals(tenia) !token.equals(continua) !token.equals(genera) ) + !token.equals(venia) !token.equals(tenia) !token.equals(continua) !token.equals(genera) !token.equals(faria)) ||(matchPostagRegexp(tokens[i-1],DETERMINANT_FP) matchPostagRegexp(relevantWords.get(token),NOM_FP)) ) ) { replacement = relevantWords.get(token).getToken(); } + //fumaré una faria (correct: fària) + else if ( i2 matchPostagRegexp(tokens[i-2],VERB_CONJUGAT) +((matchPostagRegexp(tokens[i-1],DETERMINANT_MS) matchPostagRegexp(relevantWords.get(token),NOM_MS)) + ||(matchPostagRegexp(tokens[i-1],DETERMINANT_MP) matchPostagRegexp(relevantWords.get(token),NOM_MP)) + ||(matchPostagRegexp(tokens[i-1],DETERMINANT_FS) matchPostagRegexp(relevantWords.get(token),NOM_FS)) + ||(matchPostagRegexp(tokens[i-1],DETERMINANT_FP) matchPostagRegexp(relevantWords.get(token),NOM_FP)) ) ) + { + replacement = relevantWords.get(token).getToken(); + } //circumstancies d'un altre caire else if ( !token.equals(venia) !token.equals(venies) !token.equals(tenia) !token.equals(tenies) + !token.equals(faria) !token.equals(faries) !token.equals(continua) !token.equals(continues) !token.equals(cantar) mPreposicioDE.matches() !matchPostagRegexp(tokens[i-1],NOT_IN_PREV_TOKEN) (itokens.length-2) !matchPostagRegexp(tokens[i+2],INFINITIU) @@ -173,6 +183,7 @@ } //la renuncia del president
[LanguageTool] SF.net SVN: languagetool:[7762] trunk/JLanguageTool/src
Revision: 7762 http://languagetool.svn.sourceforge.net/languagetool/?rev=7762view=rev Author: jaumeortola Date: 2012-07-27 18:02:52 + (Fri, 27 Jul 2012) Log Message: --- [ca] Improved rule: DALT. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-27 17:09:32 UTC (rev 7761) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/AccentuationCheckRule.java 2012-07-27 18:02:52 UTC (rev 7762) @@ -146,7 +146,7 @@ // verb without accent - noun with accent if (isRelevantWord) { - //amb renuncies DETERMINANT + //amb renuncies if (tokens[i-1].hasPosTag(SPS00) !matchPostagRegexp(tokens[i-1],DETERMINANT) !matchPostagRegexp(tokens[i],INFINITIU) ) { replacement = relevantWords.get(token).getToken(); Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-27 17:09:32 UTC (rev 7761) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-27 18:02:52 UTC (rev 7762) @@ -2278,19 +2278,47 @@ example type=correctVa estar a punt de morir./example /rule /rulegroup -rule id=DALT name=d'alt/dalt -pattern -token regexp=yesa|fins|de/token -marker -tokend'/token -tokenalt/token -/marker -/pattern -messagePotser és: suggestiondalt/suggestion./message -shortConfusió./short -example type=incorrectVan pujar fins markerd'alt/marker./example -example type=correctVan pujar fins markerdalt/marker./example -/rule +rulegroup id=DALT name=*d'alt/dalt +rule +pattern +token regexp=yesa|fins|de/token +marker +tokend'/token +tokenalt/token +/marker +/pattern +messagePotser és: suggestiondalt/suggestion./message +shortConfusió./short +example type=incorrectVan pujar fins markerd'alt/marker./example +example type=correctVan pujar fins markerdalt/marker./example +/rule +rule +pattern +marker +tokend'/token +tokenalt/token +/marker +token postag=D[AID].* postag_regexp=yes/token +/pattern +messagePotser és: suggestiondalt/suggestion./message +shortConfusió./short +example type=incorrectVan pujar markerd'alt/marker la terrassa./example +example type=correctVan pujar dalt la terrassa./example +/rule +rule +pattern +marker +tokend'/token +tokenalt/token +/marker +token inflected=yesde/token +/pattern +messagePotser és: suggestiondalt/suggestion./message +shortConfusió./short +example type=incorrectVan pujar markerd'alt/marker de tot./example +example type=correctVan pujar dalt de tot./example +/rule +/rulegroup rulegroup id=DARRERA name=darrera/darrere rule pattern This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7765] trunk/JLanguageTool/src
Revision: 7765 http://languagetool.svn.sourceforge.net/languagetool/?rev=7765view=rev Author: jaumeortola Date: 2012-07-27 23:45:40 + (Fri, 27 Jul 2012) Log Message: --- [ca] Fixed some false alarms. Modified Paths: -- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java === --- trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java 2012-07-27 22:18:47 UTC (rev 7764) +++ trunk/JLanguageTool/src/java/org/languagetool/rules/ca/ComplexAdjectiveConcordanceRule.java 2012-07-27 23:45:40 UTC (rev 7765) @@ -76,7 +76,7 @@ private static final Pattern COORDINACIO = Pattern.compile(,|i|o); private static final Pattern COORDINACIO_IONI = Pattern.compile(i|o|ni); private static final Pattern KEEP_COUNT = Pattern.compile(A.*|N.*|D[NAID].*|SPS.*|R.*|V.P.*); - private static final Pattern KEEP_COUNT2 = Pattern.compile(,|i|o|ni); + private static final Pattern KEEP_COUNT2 = Pattern.compile(,|i|o|ni|\\d+); private static final Pattern PREPOSICIONS = Pattern.compile(SPS.*); private static final Pattern VERB_AUXILIAR = Pattern.compile(V[AS].*); private static final Pattern EXCEPCIONS_PARTICIPI = Pattern.compile(atès|atés|atesa|atesos|ateses|donat|donats|donada|donades); Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-27 22:18:47 UTC (rev 7764) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-27 23:45:40 UTC (rev 7765) @@ -4712,7 +4712,7 @@ marker and token postag=A.* postag_regexp=yesexception postag=_GN_.* postag_regexp=yes /exception regexp=yes\p{Lu}+[\p{Ll}·]*/exceptionexception regexp=yes[\p{Ll}·]+(e|[aei]sses|[ae]res|era)/exception/token -token postag=V.* postag_regexp=yesexception postag=_GV_ //token +token postag=V.* postag_regexp=yesexception postag=_GV_|VMIP1S0 postag_regexp=yes //token /and /marker /pattern @@ -5125,6 +5125,18 @@ disambig action=filter postag=I / /rule /rulegroup +rulegroup id=interjeccio name=interjeccions +rule +pattern +token postag=SENT_START|CC postag_regexp=yes/token +marker +tokenvaja/token +/marker +token regexp=yes,|\.\.\.|\./token +/pattern +disambig action=filter postag=I / +/rule +/rulegroup rule id=PI_N name=pronom indefinit i nom pattern and Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-27 22:18:47 UTC (rev 7764) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-27 23:45:40 UTC (rev 7765) @@ -3051,10 +3051,8 @@ /pattern messageCal dir suggestionel match no=2/match/suggestion./message shortError ortogràfic/short -example type=incorrectmarkerl'iogurt/marker -/example -example type=correctmarkerel iogurt/marker -/example +example type=incorrectmarkerl'iogurt/marker/example +example type=correctmarkerel iogurt/marker/example /rule rule pattern @@ -3063,12 +3061,9 @@ /pattern messageCal dir suggestionla match no=2/match/suggestion./message shortError ortogràfic/short -example type=incorrectmarkerl'universitat/marker -/example -example type=correctmarkerla universitat/marker -/example +example type=incorrectmarkerl'universitat/marker/example +example type=correctmarkerla universitat/marker/example example type=correctl'intel·lectual valencià/example -example type=correctla intel·lectual valenciana/example /rule rule pattern @@ -3079,12 +3074,14 @@ token postag=_GN_MS / /and /marker -token postag=_GN_FS / +token postag=_GN_FSexception postag=_GN_MS//token /pattern messageCal dir suggestionla match no=2/match
[LanguageTool] SF.net SVN: languagetool:[7767] trunk/JLanguageTool/build.xml
Revision: 7767 http://languagetool.svn.sourceforge.net/languagetool/?rev=7767view=rev Author: jaumeortola Date: 2012-07-28 08:48:09 + (Sat, 28 Jul 2012) Log Message: --- [ja] Copy Japan resource file to distribution. This removes an error in LanguagetoolGUI. Modified Paths: -- trunk/JLanguageTool/build.xml Modified: trunk/JLanguageTool/build.xml === --- trunk/JLanguageTool/build.xml 2012-07-28 08:18:41 UTC (rev 7766) +++ trunk/JLanguageTool/build.xml 2012-07-28 08:48:09 UTC (rev 7767) @@ -664,6 +664,8 @@ copy file=${resource.dir}/ca/disambiguation.xml todir=${dist.dir}/resource/ca / copy file=${resource.dir}/ca/README todir=${dist.dir}/resource/ca / copy file=${resource.dir}/ca/ca.ngp todir=${dist.dir}/resource/ca / + + copy file=${resource.dir}/ja/ja.ngp todir=${dist.dir}/resource/ja / copy file=${resource.dir}/zh/coreDict.dct todir=${dist.dir}/resource/zh / copy file=${resource.dir}/zh/BigramDict.dct todir=${dist.dir}/resource/zh / This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7772] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7772 http://languagetool.svn.sourceforge.net/languagetool/?rev=7772view=rev Author: jaumeortola Date: 2012-07-29 06:55:14 + (Sun, 29 Jul 2012) Log Message: --- [ca] New rule: CONFUSIO_PARTICIPI_INFINITIU. Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-28 18:16:54 UTC (rev 7771) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-29 06:55:14 UTC (rev 7772) @@ -1645,7 +1645,7 @@ example type=incorrectNo markercomposa/marker mai./example example type=correctNo markercompon/marker mai./example /rule -rule id=VAREM_INFINITIU name=Errors en el passat compost +rule id=VAREM_INFINITIU name=Errors d'accentuació en el passat compost (*varem/vàrem) pattern marker token regexp=yesvarem|vareu/token @@ -1657,6 +1657,19 @@ example type=incorrectmarkerVarem/marker dir./example example type=correctmarkerVàrem/marker dir./example /rule +rule id=CONFUSIO_PARTICIPI_INFINITIU name=Nom + adverbi + participi: un país secularment *humanitzar/humanitzat +pattern +token postag=N.[MC][SN].* postag_regexp=yes/ +token postag=RG/ +marker +token postag=V.[GN].* postag_regexp=yes/ +/marker +/pattern +messagePotser vols dir suggestionmatch no=3 postag=VMP00SM//suggestion./message +shortPossible confusió/short +example type=incorrectun país secularment markerhumanitzar/marker com el nostre/example +example type=correctun país secularment humanitzat com el nostre/example +/rule !-- Només funciona per a algunes situacions: van beguts, considerin oportú. rulegroup id=concorda_verb_objecte name=Comprova concordança: verb + participi/adjectiu rule pattern mark_from=0 mark_to=0 This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7778] trunk/JLanguageTool/src
Revision: 7778 http://languagetool.svn.sourceforge.net/languagetool/?rev=7778view=rev Author: jaumeortola Date: 2012-07-29 17:58:29 + (Sun, 29 Jul 2012) Log Message: --- [ca] New rules: ves/v?\195?\169s, c?\195?\179rrer/anar/ser a c?\195?\160rrec de, (de) cara a. Disambiguation: enlaire (verb/adverb). Modified Paths: -- trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-29 17:56:45 UTC (rev ) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-29 17:58:29 UTC (rev 7778) @@ -4665,8 +4665,19 @@ /marker /pattern disambig action=filter postag=[^V].*/disambig -/rule - +/rule +rule id=VerbAdverbi name=verb (sense pronoms) i adverbi +!-- mans enlaire, s'enlaire -- +pattern +marker +and +token postag=RG/ +token postag=V.[MSI].* postag_regexp=yes regexp=yesexception postag=_GV_ //token +/and +/marker +/pattern +disambig action=filter postag=[^V].*/disambig +/rule rule id=VerbNom name=verb i nom que no ha concordat !-- Això fou estrany -- pattern token postag=V.[MSI].*|_GV_ postag_regexp=yes negate_pos=yesexception postag=V.[MSI].*|_GV_ postag_regexp=yes//token Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-29 17:56:45 UTC (rev ) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-29 17:58:29 UTC (rev 7778) @@ -2678,12 +2678,12 @@ /rulegroup /category category name=Errors gramaticals -rule id=TOT_I name=tot i +rule id=TOT_I_GERUNDI name=tot i + *gerundi/infinitiu pattern tokentot/token tokeni/token marker -token postag=V.[^N].* postag_regexp=yes/token +token postag=V.G.* postag_regexp=yes/token /marker /pattern messageEl verb ha d'anar en infinitiu:suggestionmatch no=3 postag=V.N.* postag_regexp=yes/match/suggestion./message @@ -3137,8 +3137,64 @@ category name=Accents diacrítics rulegroup id=ACCENTS_DIACRITICS name=Comprova accents diacrítics diversos: rés, bé, és !--si que -- + rule +pattern +marker +tokenves/token +/marker +token negate=yes regexp=yesper|si|que/token +/pattern +messageS'accentua quan és del verb anar: suggestionvés/suggestion./message +shortS'accentua quan és del verb anar./short +example type=incorrectmarkerves/marker cap allà/example +example type=correctvés cap allà/example +example type=correctVes que no ho facis!/example +example type=correctVes si n'he tinguda, de mala sort./example +/rule rule pattern +marker +tokenves/token +/marker +tokenper/token +token negate=yeson/token +/pattern +messageS'accentua quan és del verb anar: suggestionvés/suggestion./message +shortS'accentua quan és del verb anar./short +example type=incorrectmarkerVes/marker per allà./example +example type=correctVés per allà./example +/rule +rule +pattern +marker +tokenves/token +/marker +tokenper/token +tokenon/token +token negate=yes,/token +/pattern +messageS'accentua quan és del verb anar: suggestionvés/suggestion./message +shortS'accentua quan és del verb anar./short +example type=incorrectmarkerVes/marker per on vulgues./example +example type=correctVes per on, això m'agrada./example +/rule +rule +pattern +marker +tokenvés/token +/marker +tokenper/token +tokenon/token +token,/token +/pattern +messageNo s'accentua quan és del verb veure: suggestionves/suggestion./message +shortNo s'accentua./short
[LanguageTool] SF.net SVN: languagetool:[7779] trunk/JLanguageTool/src
Revision: 7779 http://languagetool.svn.sourceforge.net/languagetool/?rev=7779view=rev Author: jaumeortola Date: 2012-07-30 00:07:57 + (Mon, 30 Jul 2012) Log Message: --- [ca] Fixed false alarms: es deixa caure, jo mateixa. Modified Paths: -- trunk/JLanguageTool/src/resource/ca/disambiguation.xml trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-29 17:58:29 UTC (rev 7778) +++ trunk/JLanguageTool/src/resource/ca/disambiguation.xml 2012-07-30 00:07:57 UTC (rev 7779) @@ -2044,6 +2044,19 @@ /pattern disambig action=filter postag=V.*/disambig /rule +rule id=PronomNom name=nom i pronom +!-- jo, mi, la, te, ens -- +pattern +tokenexception postag=D[AID].* postag_regexp=yes //token +marker +and +token postag=PP.* postag_regexp=yes/ +token postag=N.* postag_regexp=yes/ +/and +/marker +/pattern +disambig action=filter postag=[^N].*/disambig +/rule rulegroup id=DNA name=Det + Nom + Adj/Possessiu/participi !--Falla amb nom neutre?: Aquest art expressa -- Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-29 17:58:29 UTC (rev 7778) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-07-30 00:07:57 UTC (rev 7779) @@ -1092,7 +1092,7 @@ marker token postag=P0.* postag_regexp=yes skip=2exception postag=P[0P].*|V.[^MNGP].*|SENT_END scope=next postag_regexp=yes negate_pos=yes //token /marker -token postag=V.[^MNGP].* postag_regexp=yes skip=1exception scope=nextper/exception/token +token postag=V.[^MNGP].* postag_regexp=yes skip=1exception scope=nextper/exceptionexception inflected=yesdeixar/exception/token /unify token regexp=yescaure|callar|témer|marxar|albergar|olorar/token /pattern @@ -1104,6 +1104,7 @@ example type=incorrectTu markeret/marker pots caure./example example type=correctEl nen pot caure./example example type=correctEl nen et pot caure./example +example type=correctEs deixaven caure./example /rule !-- -- rule This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7929] trunk/JLanguageTool
Revision: 7929 http://languagetool.svn.sourceforge.net/languagetool/?rev=7929view=rev Author: jaumeortola Date: 2012-08-26 21:49:04 + (Sun, 26 Aug 2012) Log Message: --- [ca] Rule improved: no cal confondre/cal no confondre Modified Paths: -- trunk/JLanguageTool/.classpath trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/.classpath === --- trunk/JLanguageTool/.classpath 2012-08-26 15:01:19 UTC (rev 7928) +++ trunk/JLanguageTool/.classpath 2012-08-26 21:49:04 UTC (rev 7929) @@ -41,7 +41,6 @@ classpathentry kind=lib path=libs/lucene-analyzers-common-4.0.0-BETA.jar/ classpathentry kind=lib path=libs/lucene-sandbox-4.0.0-BETA.jar/ classpathentry kind=lib path=libs/junit-4.7.jar/ - classpathentry kind=lib path=libs/jakarta-regexp-1.4.jar/ classpathentry kind=lib path=libs/tika-core-0.9.jar/ classpathentry kind=lib path=libs/ictclas4j-1.0.jar/ classpathentry kind=lib path=libs/CJFtransform_v1.0.1_bin.jar/ Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-26 15:01:19 UTC (rev 7928) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-26 21:49:04 UTC (rev 7929) @@ -6444,15 +6444,16 @@ example type=correctNo tenia cap dubte que sí./example /rule /rulegroup -rule id=NO_CAL_OBLIDAR name=no cal oblidat/cal no oblidar +rule id=NO_CAL_OBLIDAR name=*no cal oblidar/cal no oblidar pattern tokenno/token token inflected=yescaldre/token -tokenoblidar/token +token regexp=yesoblidar|confondre/token /pattern messagePotser volíeu dir suggestionmatch no=2 / match no=1 case_conversion=alllower / match no=3 //suggestion./message shortSuggeriment/short example type=incorrectmarkerNo cal oblidar/marker que les coses són així./example +example type=incorrectmarkerNo cal confondre/marker les coses./example example type=correctmarkerCal no oblidar/marker que les coses són així./example /rule rule id=PAPER_SECANT name=paper secant This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7930] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7930 http://languagetool.svn.sourceforge.net/languagetool/?rev=7930view=rev Author: jaumeortola Date: 2012-08-26 22:36:29 + (Sun, 26 Aug 2012) Log Message: --- [ca] new rule: ACABAR + GERUNDI Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-26 21:49:04 UTC (rev 7929) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-26 22:36:29 UTC (rev 7930) @@ -1257,6 +1257,18 @@ /rule /rulegroup rulegroup id=PERIFRASIS name=Perífrasis d'obligació i de dubte +rule id=ACABAR_GERUNDI name=*acabà fer/acabà fent +pattern +token inflected=yesacabar/token +marker +token postag=V.N.* postag_regexp=yes/token +/marker +/pattern +messagePerífrasi verbal incorrecta: suggestionmatch no=2 postag=(..)(.+) postag_regexp=yes postag_replace=$1G/match/suggestion./message +example type=incorrectVa acabar markerdedicar/marker-li l'obra./example +example type=correctAcabà dedicant-li l'obra./example +example type=correctPer acabar farem això./example +/rule rule id=HI_HA_QUE name=Incorrecte: «haver-hi que» pattern marker This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7934] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7934 http://languagetool.svn.sourceforge.net/languagetool/?rev=7934view=rev Author: jaumeortola Date: 2012-08-27 22:26:00 + (Mon, 27 Aug 2012) Log Message: --- [ca] new rules: cap els/cap als; possessius sense article. Fixed false alarms. Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-27 20:02:44 UTC (rev 7933) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-27 22:26:00 UTC (rev 7934) @@ -1028,6 +1028,81 @@ /rule /rulegroup /category +category name=Possessius +rulegroup id=POSSESSIU_SENSE_ARTICLE name=possessiu sense article: de meua casa +rule +pattern +tokenexception postag=D[AIN].*|N.* postag_regexp=yes//token +marker +token regexp=yes[mts]e(u|us|ua|ues|va|ves)|[nv]ostr(a|es?)exception postag=LOC_ADV/exception regexp=yesseus?|nostr(e|a)/exception/token +/marker +token postag=N.* postag_regexp=yes/ +/pattern +messageFalta un article./message +example type=incorrectAixò és de markermeu/marker avi./example +example type=incorrectsón coneguts per markerseua/marker força/example +example type=correctAixò és del meu avi./example +example type=correcten la seva majoria/example +example type=correctLa mort i resurrecció de Nostre Senyor Jesucrist./example +example type=correcta la sortida de casa seva Francesc Layret/example +example type=correctcom a seu oficial dels Jocs/example +/rule +rule +pattern +tokenexception postag=D[AIN].*|N.* postag_regexp=yes//token +marker +token regexp=yesseus?exception postag=LOC_ADV//token +/marker +token postag=N.* postag_regexp=yesexception postag=A..[FC].*|V.P00.F postag_regexp=yes//token +/pattern +messageFalta un article./message +example type=incorrectAixò és de markerseu/marker avi./example +example type=correctcom a seu oficial dels Jocs/example +/rule +rule +pattern +tokenexception postag=D[AIN].* postag_regexp=yes//token +marker +token regexp=yes[mts]e(u|us|ua|ues|va|ves)|[nv]ostr(a|es?)exception postag=LOC_ADV/exception regexp=yesnostr(e|a)/exception/token +/marker +token postag=A.*|V.P.* postag_regexp=yes/ +token postag=N.* postag_regexp=yes/ +/pattern +messageFalta un article./message +example type=incorrectdesplaçant markerseus/marker anteriors alfabets/example +example type=correctdesplaçant els seus anteriors alfabets/example +example type=correctPublica la Passió de Nostre Senyor Jesucrist./example +/rule +rule +pattern +tokenexception postag=D[AIN].*|N.* postag_regexp=yes//token +marker +token regexp=yesnostr(a|e)exception postag=LOC_ADV//token +/marker +token postag=N.* postag_regexp=yesexception regexp=yes(?-i)(Senyora?|Pare)/exception/token +/pattern +messageFalta un article./message +example type=incorrectAixò és de markernostre/marker pare./example +example type=incorrectsemblant a markernostre/marker terme actual./example +example type=correctAixò és del nostre pare./example +example type=correctLa mort i resurrecció de Nostre Pare./example +/rule +rule +pattern +tokenexception postag=D[AIN].*|N.* postag_regexp=yes//token +marker +token regexp=yesnostr(a|e)exception postag=LOC_ADV//token +/marker +token postag=A.*|V.P.* postag_regexp=yesexception regexp=yes(?-i)Senyora?/exception/token +token postag=N.* postag_regexp=yes/ +/pattern +messageFalta un article./message +example type=incorrectAixò és de markernostre/marker estimat avi./example +example type=correctLa mort i resurrecció de Nostre Senyor Jesucrist./example +/rule + +/rulegroup +/category category name
[LanguageTool] SF.net SVN: languagetool:[7935] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7935 http://languagetool.svn.sourceforge.net/languagetool/?rev=7935view=rev Author: jaumeortola Date: 2012-08-28 12:00:19 + (Tue, 28 Aug 2012) Log Message: --- [ca] new rule: *cap el(s)/ cap al(s) Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-27 22:26:00 UTC (rev 7934) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-28 12:00:19 UTC (rev 7935) @@ -2085,15 +2085,37 @@ /category category name=Preposicions rule id=CAP_ELS_CAP_ALS name=*cap els/cap als -!-- Falten excepcions... -- +!-- Falten excepcions!! -- pattern -tokencap/token -tokenels/token +token negate=yesaexception postag=V.* postag_regexp=yes inflected=yesfer/exception/token +marker +tokencapexception postag=_GN_.* postag_regexp=yes//token +tokenels/token +/marker /pattern messageVolíeu dir suggestioncap als/suggestion?/message example type=incorrectla confiança markercap els/marker partits/example example type=correctla confiança cap als partits/example +example type=correctque portaren a cap els comtes/example +example type=correcton fan cap els comtes/example +example type=correcttocar amb el cap els esquís de la gent/example /rule +rule id=CAP_EL_CAP_AL name=*cap el/cap al +!-- Falten excepcions!! -- +pattern +token negate=yesaexception postag=V.* postag_regexp=yes inflected=yesfer/exception/token +marker +tokencapexception postag=_GN_.* postag_regexp=yes//token +tokenel/token +/marker +/pattern +messageVolíeu dir suggestioncap al/suggestion?/message +example type=incorrectla confiança markercap el/marker partit/example +example type=correctla confiança cap al partit/example +example type=correctque tingué com a cap el Comte d'Espanya/example +example type=correcton fa cap el Comte/example +example type=correctla Colònia del Cap el 1788/example +/rule rulegroup id=DACI_A name=d'ací a rule pattern This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7943] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7943 http://languagetool.svn.sourceforge.net/languagetool/?rev=7943view=rev Author: jaumeortola Date: 2012-08-29 11:42:18 + (Wed, 29 Aug 2012) Log Message: --- [ca] new rule: *apart/a part Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 06:33:59 UTC (rev 7942) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 11:42:18 UTC (rev 7943) @@ -1317,7 +1317,7 @@ example type=correctNo vaig markertelefonar-li/marker/example /rule /rulegroup -rulegroup id=cabre name=cabre (incorrecte) +rulegroup id=cabre name=*cabre + infinitiu rule pattern marker @@ -5645,6 +5645,21 @@ /rule /category category name=Expressions +rulegroup id=APART name=*apart/a part +rule +pattern +tokenexception postag=D[DAI]0[MC]S0 postag_regexp=yes//token +marker +tokenapart/token +/marker +/pattern +message¿Volíeu dir suggestiona part/suggestion?/message +example type=incorrectmarkerApart/marker del nostre país/example +example type=incorrectDeixant markerapart/marker l'estil dels trobadors/example +example type=correctA part del nostre país/example +example type=correctLlavors va fer un apart/example +/rule +/rulegroup rule id=CARA_A name=*cara a/de cara a pattern token negate=yes inflected=yes regexp=yesplantar|ferexception regexp=yesde|la/exception/token This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7944] trunk/JLanguageTool/src
Revision: 7944 http://languagetool.svn.sourceforge.net/languagetool/?rev=7944view=rev Author: jaumeortola Date: 2012-08-29 14:30:16 + (Wed, 29 Aug 2012) Log Message: --- [ca] new rule: *un a/una Modified Paths: -- trunk/JLanguageTool/src/resource/ca/multiwords.txt trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/resource/ca/multiwords.txt === --- trunk/JLanguageTool/src/resource/ca/multiwords.txt 2012-08-29 11:42:18 UTC (rev 7943) +++ trunk/JLanguageTool/src/resource/ca/multiwords.txt 2012-08-29 14:30:16 UTC (rev 7944) @@ -25,6 +25,8 @@ a la fiLOC_ADV a la vegadaLOC_ADV A la vegadaLOC_ADV +A mesura que LOC_CONJ +a mesura que LOC_CONJ A més LOC_ADV a més LOC_ADV a més a mésLOC_ADV @@ -309,6 +311,8 @@ en general LOC_ADV En gran part LOC_ADV en gran part LOC_ADV +En la mesura que LOC_CONJ +en la mesura que LOC_CONJ En la seua majoria LOC_ADV en la seua majoria LOC_ADV en la seva majoria LOC_ADV Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 11:42:18 UTC (rev 7943) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 14:30:16 UTC (rev 7944) @@ -2339,6 +2339,34 @@ /rulegroup /category category name=Confusions +rule id=UN_A name=*un a/una +pattern +marker +token regexp=yesalgun|aquest|un/token +tokena/token +/marker +token postag=NC[FC]S.*|A..[FC]S.*|V.P00SF postag_regexp=yesexceptionsota/exception/token +/pattern +message¿Volíeu dir suggestionmatch no=1/match no=2//suggestion?/message +example type=incorrectmarkeralgun a/marker cosa/example +example type=correctalguna cosa/example +example type=correctL'augment d'aquest a mesura que creix l'altre./example +/rule +rulegroup id=APART name=*apart/a part +rule +pattern +tokenexception postag=D[DAI]0[MC]S0 postag_regexp=yes//token +marker +tokenapart/token +/marker +/pattern +message¿Volíeu dir suggestiona part/suggestion?/message +example type=incorrectmarkerApart/marker del nostre país/example +example type=incorrectDeixant markerapart/marker l'estil dels trobadors/example +example type=correctA part del nostre país/example +example type=correctLlavors va fer un apart/example +/rule +/rulegroup rulegroup id=MOL_MOLT name=*mol(s)/molt(s) rule pattern @@ -5645,21 +5673,6 @@ /rule /category category name=Expressions -rulegroup id=APART name=*apart/a part -rule -pattern -tokenexception postag=D[DAI]0[MC]S0 postag_regexp=yes//token -marker -tokenapart/token -/marker -/pattern -message¿Volíeu dir suggestiona part/suggestion?/message -example type=incorrectmarkerApart/marker del nostre país/example -example type=incorrectDeixant markerapart/marker l'estil dels trobadors/example -example type=correctA part del nostre país/example -example type=correctLlavors va fer un apart/example -/rule -/rulegroup rule id=CARA_A name=*cara a/de cara a pattern token negate=yes inflected=yes regexp=yesplantar|ferexception regexp=yesde|la/exception/token @@ -7015,8 +7028,8 @@ /rule /rulegroup /category -!-- category name=Sintaxi -rulegroup id=ordre_dubtos name=ordres de frase dubtosos +!--category name=Sintaxi + rulegroup id=ordre_dubtos name=ordres de frase dubtosos rule pattern token postag=DA.* postag_regexp=yes/ This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[7945] trunk/JLanguageTool/src/rules/ca/grammar. xml
Revision: 7945 http://languagetool.svn.sourceforge.net/languagetool/?rev=7945view=rev Author: jaumeortola Date: 2012-08-29 17:28:08 + (Wed, 29 Aug 2012) Log Message: --- [ca] new rule: un any *despr?\195?\168s/despr?\195?\169s Modified Paths: -- trunk/JLanguageTool/src/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 14:30:16 UTC (rev 7944) +++ trunk/JLanguageTool/src/rules/ca/grammar.xml2012-08-29 17:28:08 UTC (rev 7945) @@ -2339,6 +2339,44 @@ /rulegroup /category category name=Confusions +rulegroup id=DESPRES name=un any *desprès/després +!-- Possible false alarms: és molt desprès (generós); un home desprès... -- +rule +pattern +token negate=yes inflected=yeshaver/token +marker +tokendesprès/token +/marker +/pattern +message¿Volíeu dir suggestiondesprés/suggestion?/message +example type=incorrectuns anys markerdesprès/marker/example +example type=correctuns anys després/example +example type=corrects'ha desprès de tot/example +/rule +!-- rule +pattern +token postag=NC.* postag_regexp=yes inflected=yes regexp=yessegon|minut|hora|dia|setmana|mes|(tri|quadri|se)mestre|any|lustre|dècada|segle|mil·leni|moment|instant|temps/token +marker +tokendesprès/token +/marker +/pattern +message¿Volíeu dir suggestiondesprés/suggestion?/message +example type=incorrectuns markeranys desprès/marker/example +example type=correctuns anys després/example +/rule +rule +pattern +marker +tokendesprès/token +/marker +token regexp=yesde|d'/token +token postag=V.N.* postag_regexp=yes/ +/pattern +message¿Volíeu dir suggestiondesprés/suggestion?/message +example type=incorrectmarkerdesprès de cantar/marker/example +example type=correctdesprés de cantar/example +/rule -- +/rulegroup rule id=UN_A name=*un a/una pattern marker This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[8011] trunk/JLanguageTool/src
Revision: 8011 http://languagetool.svn.sourceforge.net/languagetool/?rev=8011view=rev Author: jaumeortola Date: 2012-09-09 17:43:06 + (Sun, 09 Sep 2012) Log Message: --- [ca] New Java rule: CATALAN_WRONG_WORD_IN_CONTEXT Modified Paths: -- trunk/JLanguageTool/src/main/java/org/languagetool/language/Catalan.java trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/grammar.xml Added Paths: --- trunk/JLanguageTool/src/main/java/org/languagetool/rules/ca/CatalanWrongWordInContextRule.java trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/wrongWordInContext.txt trunk/JLanguageTool/src/test/java/org/languagetool/rules/ca/CatalanWrongWordInContextRuleTest.java Modified: trunk/JLanguageTool/src/main/java/org/languagetool/language/Catalan.java === --- trunk/JLanguageTool/src/main/java/org/languagetool/language/Catalan.java 2012-09-09 13:57:14 UTC (rev 8010) +++ trunk/JLanguageTool/src/main/java/org/languagetool/language/Catalan.java 2012-09-09 17:43:06 UTC (rev 8011) @@ -36,6 +36,7 @@ import org.languagetool.rules.ca.CatalanUnpairedQuestionMarksRule; import org.languagetool.rules.ca.ComplexAdjectiveConcordanceRule; import org.languagetool.rules.ca.MorfologikCatalanSpellerRule; +import org.languagetool.rules.ca.CatalanWrongWordInContextRule; import org.languagetool.rules.patterns.Unifier; import org.languagetool.synthesis.Synthesizer; import org.languagetool.synthesis.ca.CatalanSynthesizer; @@ -44,14 +45,14 @@ import org.languagetool.tagging.disambiguation.Disambiguator; import org.languagetool.tagging.disambiguation.ca.CatalanHybridDisambiguator; import org.languagetool.tokenizers.SRXSentenceTokenizer; -import org.languagetool.tokenizers.SentenceTokenizer; +//import org.languagetool.tokenizers.SentenceTokenizer; import org.languagetool.tokenizers.Tokenizer; import org.languagetool.tokenizers.ca.CatalanWordTokenizer; public class Catalan extends Language { private Tagger tagger; - private SentenceTokenizer sentenceTokenizer; + //private SentenceTokenizer sentenceTokenizer; private Tokenizer wordTokenizer; private Synthesizer synthesizer; private Disambiguator disambiguator; @@ -107,7 +108,8 @@ CatalanUnpairedQuestionMarksRule.class, CatalanUnpairedExclamationMarksRule.class, AccentuationCheckRule.class, -ComplexAdjectiveConcordanceRule.class +ComplexAdjectiveConcordanceRule.class, +CatalanWrongWordInContextRule.class //CastellanismesReplaceRule.class, //AccentuacioReplaceRule.class ); @@ -129,13 +131,13 @@ return synthesizer; } - @Override - public final SentenceTokenizer getSentenceTokenizer() { -if (sentenceTokenizer == null) { - sentenceTokenizer = new SRXSentenceTokenizer(this); -} -return sentenceTokenizer; - } +// @Override +// public final SentenceTokenizer getSentenceTokenizer() { +//if (sentenceTokenizer == null) { +// sentenceTokenizer = new SRXSentenceTokenizer(this); +//} +//return sentenceTokenizer; +// } @Override public Unifier getUnifier() { Added: trunk/JLanguageTool/src/main/java/org/languagetool/rules/ca/CatalanWrongWordInContextRule.java === --- trunk/JLanguageTool/src/main/java/org/languagetool/rules/ca/CatalanWrongWordInContextRule.java (rev 0) +++ trunk/JLanguageTool/src/main/java/org/languagetool/rules/ca/CatalanWrongWordInContextRule.java 2012-09-09 17:43:06 UTC (rev 8011) @@ -0,0 +1,67 @@ +/* LanguageTool, a natural language style checker + * Copyright (C) 2012 Markus Brenneis + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Lesser General Public + * License as published by the Free Software Foundation; either + * version 2.1 of the License, or (at your option) any later version. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Lesser General Public License for more details. + * + * You should have received a copy of the GNU Lesser General Public + * License along with this library; if not, write to the Free Software + * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 + * USA + */ +package org.languagetool.rules.ca; + +import java.io.IOException; +import java.util.ResourceBundle; + +import org.languagetool.rules.WrongWordInContextRule; + +public class CatalanWrongWordInContextRule extends WrongWordInContextRule { + + public CatalanWrongWordInContextRule(final ResourceBundle messages) throws IOException { +super(messages); + } + + @Override + protected String
[LanguageTool] SF.net SVN: languagetool:[8012] trunk/JLanguageTool/.classpath
Revision: 8012 http://languagetool.svn.sourceforge.net/languagetool/?rev=8012view=rev Author: jaumeortola Date: 2012-09-09 17:49:33 + (Sun, 09 Sep 2012) Log Message: --- .classpath file for Eclipse. Modified Paths: -- trunk/JLanguageTool/.classpath Modified: trunk/JLanguageTool/.classpath === --- trunk/JLanguageTool/.classpath 2012-09-09 17:43:06 UTC (rev 8011) +++ trunk/JLanguageTool/.classpath 2012-09-09 17:49:33 UTC (rev 8012) @@ -1,9 +1,15 @@ ?xml version=1.0 encoding=UTF-8? classpath - classpathentry kind=src path=src/main/java/ - classpathentry kind=src path=src/main/resources/ classpathentry kind=src path=src/main/dev/ + classpathentry kind=src path=src/test/resources/ classpathentry kind=src path=src/test/java/ + classpathentry kind=src path=src/main/resources/ + classpathentry kind=src path=src/main/java/ + classpathentry excluding=test/|dev/|java/|main/java/|main/resources/|main/dev/|test/java/|test/|test/java/|test/|test/resources/|test/java/ kind=src path=src + attributes + attribute name=org.eclipse.jdt.launching.CLASSPATH_ATTR_LIBRARY_PATH_ENTRY value=JLanguageTool/libs/ + /attributes + /classpathentry classpathentry kind=src path=libs/native-lib/ classpathentry kind=lib path=libs/build/junit.jar sourcepath=C:/Users/user/.m2/repository/junit/junit/4.8.2/junit-4.8.2-sources.jar attributes This was sent by the SourceForge.net collaborative development platform, the world's largest Open Source development site. -- Live Security Virtual Conference Exclusive live event will cover all the ways today's security and threat landscape has changed and how IT managers can respond. Discussions will include endpoint security, mobile security and the latest in malware threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/ ___ Languagetool-cvs mailing list Languagetool-cvs@lists.sourceforge.net https://lists.sourceforge.net/lists/listinfo/languagetool-cvs
[LanguageTool] SF.net SVN: languagetool:[8054] trunk/JLanguageTool/src/main/resources/org/ languagetool
Revision: 8054 http://languagetool.svn.sourceforge.net/languagetool/?rev=8054view=rev Author: jaumeortola Date: 2012-09-15 21:40:23 + (Sat, 15 Sep 2012) Log Message: --- [ca] new rules Modified Paths: -- trunk/JLanguageTool/src/main/resources/org/languagetool/resource/ca/disambiguation.xml trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/grammar.xml Modified: trunk/JLanguageTool/src/main/resources/org/languagetool/resource/ca/disambiguation.xml === --- trunk/JLanguageTool/src/main/resources/org/languagetool/resource/ca/disambiguation.xml 2012-09-15 14:55:51 UTC (rev 8053) +++ trunk/JLanguageTool/src/main/resources/org/languagetool/resource/ca/disambiguation.xml 2012-09-15 21:40:23 UTC (rev 8054) @@ -729,7 +729,7 @@ token postag=VM[IS]P1S0 postag_regexp=yes / /marker /pattern -disambig action=filter postag=VM[IS]P1S0 / +disambig action=filter postag=V.[IS]P1S0 / /rule rule pattern @@ -739,7 +739,7 @@ token postag=VM[IS]P1S0 postag_regexp=yes / /marker /pattern -disambig action=filter postag=VM[IS]P1S0 / +disambig action=filter postag=V.[IS]P1S0 / /rule rule pattern @@ -750,7 +750,7 @@ token postag=VM[IS]P1S0 postag_regexp=yes / /marker /pattern -disambig action=filter postag=VM[IS]P1S0 / +disambig action=filter postag=V.[IS]P1S0 / /rule rule !-- un cop, aquestes tres -- @@ -2027,9 +2027,7 @@ token postag=V.N.* postag_regexp=yes/token /marker /pattern -disambig -match no=2 postag_regexp=yes postag=V.N.*/match -/disambig +disambigmatch no=2 postag_regexp=yes postag=V.N.*/match/disambig /rule rule pattern @@ -2038,8 +2036,7 @@ /marker token postag=V.N.* postag_regexp=yes/token /pattern -disambig action=addwd pos=_GV_/wd -/disambig +disambig action=addwd pos=_GV_/wd/disambig /rule rule pattern Modified: trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/grammar.xml === --- trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/grammar.xml 2012-09-15 14:55:51 UTC (rev 8053) +++ trunk/JLanguageTool/src/main/resources/org/languagetool/rules/ca/grammar.xml 2012-09-15 21:40:23 UTC (rev 8054) @@ -1026,7 +1026,23 @@ example type=incorrectmarkerles principals ganivets/marker./example example type=correctels principals ganivets./example /rule -/rulegroup +/rulegroup +rule id=LA_PENDENT name=*la/el pendent +!-- Cal un tractament especial perquè pendent és nom i adjectiu. ¿Passa igual amb altres paraules? -- +pattern +tokenexception postag=NCF.000 postag_regexp=yes//token +token postag=_GN_F. postag_regexp=yes regexp=yespendents?/token +/pattern +message'Pendent' és un nom masculí/message +shortÉs nom masculí/short +example type=incorrecten markerla pendent/marker descendent dels últims anys./example +example type=correcten el pendent descendent dels últims anys./example +example type=correctLa reforma pendent./example +example type=incorrectHi ha una markerforta pendent/marker./example +example type=correctHi ha un fort pendent./example +example type=incorrectla manca d'aigua en markerles pendents/marker superiors/example +example type=correctSón reptes pendents./example +/rule /category category name=Possessius rulegroup id=POSSESSIU_SENSE_ARTICLE name=possessiu sense article: de meua casa @@ -2211,31 +2227,123 @@ marker tokentan/token /marker -token postag=AQ.*|V.P.* postag_regexp=yes skip=10/ +token postag=AQ.[MC][SN].*|V.P.*SM postag_regexp=yes skip=10/ tokencom/token -token postag=AQ.*|V.P.* postag_regexp=yes/ +token postag=AQ.[MC][SN].*|V.P.*SM postag_regexp=yes/ /pattern messageHauria de ser: suggestiontant/suggestion./message shortConfusió./short +example type=incorrectmarkertan/marker físic com estètic./example +example type=correctTant físic com estètic./example