Revision: 7589
          
http://languagetool.svn.sourceforge.net/languagetool/?rev=7589&view=rev
Author:   milek_pl
Date:     2012-06-30 17:51:13 +0000 (Sat, 30 Jun 2012)
Log Message:
-----------
update morfologikspeller to utf-8 version, and include one utf-8 dictionary as 
an example

Modified Paths:
--------------
    trunk/JLanguageTool/libs/morfologik-speller-1.5.4.jar
    trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java

Added Paths:
-----------
    trunk/JLanguageTool/src/java/org/languagetool/rules/ml/
    trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
    trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
    trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info
    trunk/JLanguageTool/src/test/org/languagetool/rules/ml/
    trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java

Removed Paths:
-------------
    trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff
    trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dic

Modified: trunk/JLanguageTool/libs/morfologik-speller-1.5.4.jar
===================================================================
(Binary files differ)

Modified: trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java
===================================================================
--- trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java       2012-06-30 17:39:03 UTC (rev 7588)
+++ trunk/JLanguageTool/src/java/org/languagetool/language/Malayalam.java       2012-06-30 17:51:13 UTC (rev 7589)
@@ -30,7 +30,7 @@
 import org.languagetool.rules.UppercaseSentenceStartRule;
 import org.languagetool.rules.WhitespaceRule;
 import org.languagetool.rules.WordRepeatRule;
-import org.languagetool.rules.spelling.hunspell.HunspellNoSuggestionRule;
+import org.languagetool.rules.ml.MorfologikMalayalamSpellerRule;
 import org.languagetool.tagging.Tagger;
 import org.languagetool.tagging.ml.MalayalamTagger;
 import org.languagetool.tokenizers.SRXSentenceTokenizer;
@@ -100,7 +100,7 @@
             CommaWhitespaceRule.class,
             DoublePunctuationRule.class,
             GenericUnpairedBracketsRule.class,
-            HunspellNoSuggestionRule.class,
+            MorfologikMalayalamSpellerRule.class,
             UppercaseSentenceStartRule.class,
             WordRepeatRule.class,
             WhitespaceRule.class

Added: trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
===================================================================
--- trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java       (rev 0)
+++ trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java       2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,45 @@
+/* LanguageTool, a natural language style checker 
+ * Copyright (C) 2012 Marcin Miłkowski (http://www.languagetool.org)
+ * 
+ * This library is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * This library is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with this library; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA  02110-1301
+ * USA
+ */
+
+package org.languagetool.rules.ml;
+
+import java.util.ResourceBundle;
+
+import org.languagetool.Language;
+import org.languagetool.rules.spelling.morfologik.MorfologikSpellerRule;
+
+public final class MorfologikMalayalamSpellerRule extends MorfologikSpellerRule {
+
+    private static final String RESOURCE_FILENAME = "/ml/hunspell/ml_IN.dict";
+    
+    public MorfologikMalayalamSpellerRule(ResourceBundle messages,
+            Language language) {
+        super(messages, language);
+    }
+
+    @Override
+    public String getFileName() {
+        return RESOURCE_FILENAME;
+    }
+    
+    public String getId() {
+        return "MORFOLOGIK_RULE_ML_IN";
+    }
+
+}


Property changes on: trunk/JLanguageTool/src/java/org/languagetool/rules/ml/MorfologikMalayalamSpellerRule.java
___________________________________________________________________
Added: svn:mime-type
   + text/plain

Deleted: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff
===================================================================
--- trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff      2012-06-30 17:39:03 UTC (rev 7588)
+++ trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.aff      2012-06-30 17:51:13 UTC (rev 7589)
@@ -1 +0,0 @@
-SET UTF-8

Deleted: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dic
===================================================================
(Binary files differ)

Added: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
===================================================================
(Binary files differ)


Property changes on: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.dict
___________________________________________________________________
Added: svn:mime-type
   + application/octet-stream

Added: trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info
===================================================================
--- trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info     (rev 0)
+++ trunk/JLanguageTool/src/resource/ml/hunspell/ml_IN.info     2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,9 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=utf-8
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
\ No newline at end of file

Added: trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java
===================================================================
--- trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java       (rev 0)
+++ trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java       2012-06-30 17:51:13 UTC (rev 7589)
@@ -0,0 +1,52 @@
+package org.languagetool.rules.ml;
+
+import static org.junit.Assert.assertEquals;
+
+import java.io.IOException;
+
+import org.junit.Test;
+import org.languagetool.JLanguageTool;
+import org.languagetool.Language;
+import org.languagetool.TestTools;
+import org.languagetool.rules.RuleMatch;
+
+public class MorfologikMalayalamSpellerRuleTest {
+
+    @Test
+    public void testMorfologikSpeller() throws IOException {
+        MorfologikMalayalamSpellerRule rule =
+                new MorfologikMalayalamSpellerRule (TestTools.getMessages("Malayalam"), Language.MALAYALAM);
+
+        RuleMatch[] matches;
+        JLanguageTool langTool = new JLanguageTool(Language.MALAYALAM);
+
+
+        // correct sentences:
+        assertEquals(0, rule.match(langTool.getAnalyzedSentence("എന്തുകൊണ്ട്‌ അംഗത്വം")).length);
+        assertEquals(0, rule.match(langTool.getAnalyzedSentence("എങ്ങനെ അംഗമാകാം?")).length);        
+        //test for "LanguageTool":
+        assertEquals(0, rule.match(langTool.getAnalyzedSentence("LanguageTool")).length);
+        assertEquals(0, rule.match(langTool.getAnalyzedSentence(",")).length);
+        assertEquals(0, rule.match(langTool.getAnalyzedSentence("123454")).length);
+
+        //incorrect sentences:
+
+        matches = rule.match(langTool.getAnalyzedSentence("Zolw"));
+        // check match positions:
+        assertEquals(1, matches.length);
+        assertEquals(0, matches[0].getFromPos());
+        assertEquals(4, matches[0].getToPos());
+        assertEquals(matches[0].getSuggestedReplacements().isEmpty(), true);
+        
+        matches = rule.match(langTool.getAnalyzedSentence("എaങ്ങനെ"));
+        assertEquals(1, matches.length);
+        assertEquals(0, matches[0].getFromPos());
+        assertEquals(7, matches[0].getToPos());
+        assertEquals(matches[0].getSuggestedReplacements().get(0), "എങ്ങനെ");
+
+        assertEquals(1, rule.match(langTool.getAnalyzedSentence("aõh")).length);
+        assertEquals(1, rule.match(langTool.getAnalyzedSentence("a")).length);
+
+    }
+
+}


Property changes on: trunk/JLanguageTool/src/test/org/languagetool/rules/ml/MorfologikMalayalamSpellerRuleTest.java
___________________________________________________________________
Added: svn:mime-type
   + text/plain

This was sent by the SourceForge.net collaborative development platform, the 
world's largest Open Source development site.


------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and 
threat landscape has changed and how IT managers can respond. Discussions 
will include endpoint security, mobile security and the latest in malware 
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
[email protected]
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs

Reply via email to