Revision: 7589
http://languagetool.svn.sourceforge.net/languagetool/?rev=7589&view=rev
Author: milek_pl
Date: 2012-06-30 17:51:13 +0000 (Sat, 30 Jun 2012)
Log Message:
-----------
update morfologikspeller to utf-8 version, and include one utf-8 dictionary as
an example
Modified Paths:
--------------
trunk/JLanguageTool/libs/morfologik-speller-1.5.4.jar
trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java
Added Paths:
-----------
trunk/JLanguageTool/src/java/org/languagetool/rules/ml/
trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info
trunk/JLanguageTool/src/test/org/languagetool/rules/ml/
trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java
Removed Paths:
-------------
trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff
trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dic
Modified: trunk/JLanguageTool/libs/morfologik-speller-1.5.4.jar
===================================================================
(Binary files differ)
Modified: trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java
===================================================================
--- trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java 2012-06-30 17:39:03 UTC (rev 7588)
+++ trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java 2012-06-30 17:51:13 UTC (rev 7589)
@@ -30,7 +30,7 @@
import org.languagetool.rules.UppercaseSentenceStartRule;
import org.languagetool.rules.WhitespaceRule;
import org.languagetool.rules.WordRepeatRule;
-import org.languagetool.rules.spelling.hunspell.HunspellNoSuggestionRule;
+import org.languagetool.rules.ml.MorfologikMalayalamSpellerRule;
import org.languagetool.tagging.Tagger;
import org.languagetool.tagging.ml.MalayalamTagger;
import org.languagetool.tokenizers.SRXSentenceTokenizer;
@@ -100,7 +100,7 @@
CommaWhitespaceRule.class,
DoublePunctuationRule.class,
GenericUnpairedBracketsRule.class,
- HunspellNoSuggestionRule.class,
+ MorfologikMalayalamSpellerRule.class,
UppercaseSentenceStartRule.class,
WordRepeatRule.class,
WhitespaceRule.class
Added: trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
===================================================================
--- trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java (rev 0)
+++ trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java 2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,45 @@
+/* LanguageTool, a natural language style checker
+ * Copyright (C) 2012 Marcin Miłkowski (http://www.languagetool.org)
+ *
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301
+ * USA
+ */
+
+package org.languagetool.rules.ml;
+
+import java.util.ResourceBundle;
+
+import org.languagetool.Language;
+import org.languagetool.rules.spelling.morfologik.MorfologikSpellerRule;
+
+public final class MorfologikMalayalamSpellerRule extends MorfologikSpellerRule {
+
+ private static final String RESOURCE_FILENAME = "/ml/hunspell/ml_IN.dict";
+
+ public MorfologikMalayalamSpellerRule(ResourceBundle messages,
+ Language language) {
+ super(messages, language);
+ }
+
+ @Override
+ public String getFileName() {
+ return RESOURCE_FILENAME;
+ }
+
+ public String getId() {
+ return "MORFOLOGIK_RULE_ML_IN";
+ }
+
+}
Property changes on: trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
___________________________________________________________________
Added: svn:mime-type
+ text/plain
Deleted: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff
===================================================================
--- trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff 2012-06-30 17:39:03 UTC (rev 7588)
+++ trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff 2012-06-30 17:51:13 UTC (rev 7589)
@@ -1 +0,0 @@
-SET UTF-8
Deleted: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dic
===================================================================
(Binary files differ)
Added: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
===================================================================
(Binary files differ)
Property changes on: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
___________________________________________________________________
Added: svn:mime-type
+ application/octet-stream
Added: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info
===================================================================
--- trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info (rev 0)
+++ trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info 2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,9 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=utf-8
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
\ No newline at end of file
Added: trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java
===================================================================
--- trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java (rev 0)
+++ trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java 2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,52 @@
+package org.languagetool.rules.ml;
+
+import static org.junit.Assert.assertEquals;
+
+import java.io.IOException;
+
+import org.junit.Test;
+import org.languagetool.JLanguageTool;
+import org.languagetool.Language;
+import org.languagetool.TestTools;
+import org.languagetool.rules.RuleMatch;
+
+public class MorfologikMalayalamSpellerRuleTest {
+
+ @Test
+ public void testMorfologikSpeller() throws IOException {
+ MorfologikMalayalamSpellerRule rule =
+ new MorfologikMalayalamSpellerRule (TestTools.getMessages("Malayalam"), Language.MALAYALAM);
+
+ RuleMatch[] matches;
+ JLanguageTool langTool = new JLanguageTool(Language.MALAYALAM);
+
+
+ // correct sentences:
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence("എന്തുകൊണ്ട് അംഗത്വം")).length);
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence("എങ്ങനെ അംഗമാകാം?")).length);
+ //test for "LanguageTool":
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence("LanguageTool")).length);
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence(",")).length);
+ assertEquals(0, rule.match(langTool.getAnalyzedSentence("123454")).length);
+
+ //incorrect sentences:
+
+ matches = rule.match(langTool.getAnalyzedSentence("Zolw"));
+ // check match positions:
+ assertEquals(1, matches.length);
+ assertEquals(0, matches[0].getFromPos());
+ assertEquals(4, matches[0].getToPos());
+ assertEquals(matches[0].getSuggestedReplacements().isEmpty(), true);
+
+ matches = rule.match(langTool.getAnalyzedSentence("എaങ്ങനെ"));
+ assertEquals(1, matches.length);
+ assertEquals(0, matches[0].getFromPos());
+ assertEquals(7, matches[0].getToPos());
+ assertEquals(matches[0].getSuggestedReplacements().get(0), "എങ്ങനെ");
+
+ assertEquals(1, rule.match(langTool.getAnalyzedSentence("aõh")).length);
+ assertEquals(1, rule.match(langTool.getAnalyzedSentence("a")).length);
+
+ }
+
+}
Property changes on: trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java
___________________________________________________________________
Added: svn:mime-type
+ text/plain
This was sent by the SourceForge.net collaborative development platform, the
world's largest Open Source development site.
------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and
threat landscape has changed and how IT managers can respond. Discussions
will include endpoint security, mobile security and the latest in malware
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs