Revision: 7956
          
http://languagetool.svn.sourceforge.net/languagetool/?rev=7956&view=rev
Author:   dnaber
Date:     2012-09-01 23:43:42 +0000 (Sat, 01 Sep 2012)
Log Message:
-----------
small code cleanup, no functional change

Modified Paths:
--------------
    
trunk/JLanguageTool/src/java/org/languagetool/tokenizers/zh/ChineseWordTokenizer.java

Modified: 
trunk/JLanguageTool/src/java/org/languagetool/tokenizers/zh/ChineseWordTokenizer.java
===================================================================
--- 
trunk/JLanguageTool/src/java/org/languagetool/tokenizers/zh/ChineseWordTokenizer.java
       2012-09-01 20:44:15 UTC (rev 7955)
+++ 
trunk/JLanguageTool/src/java/org/languagetool/tokenizers/zh/ChineseWordTokenizer.java
       2012-09-01 23:43:42 UTC (rev 7956)
@@ -20,10 +20,12 @@
 
 import java.io.InputStream;
 import java.util.ArrayList;
+import java.util.Arrays;
 import java.util.List;
 
 import org.ictclas4j.segment.SegTag;
 import org.languagetool.JLanguageTool;
+import org.languagetool.databroker.ResourceDataBroker;
 import org.languagetool.tokenizers.Tokenizer;
 
 import cn.com.cjf.CJFBeanFactory;
@@ -32,7 +34,6 @@
 public class ChineseWordTokenizer implements Tokenizer {
 
   private SegTag seg;
-
   private ChineseJF chinesdJF;
 
   private void init() {
@@ -40,24 +41,16 @@
       chinesdJF = CJFBeanFactory.getChineseJF();
     }
     if (seg == null) {
-      InputStream coreDictIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/coreDict.dct");
-      InputStream bigramDictIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/BigramDict.dct");
-      InputStream personTaggerDctIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/nr.dct");
-      InputStream personTaggerCtxIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/nr.ctx");
-      InputStream transPersonTaggerDctIn = JLanguageTool.getDataBroker()
-          .getFromResourceDirAsStream("/zh/tr.dct");
-      InputStream transPersonTaggerCtxIn = JLanguageTool.getDataBroker()
-          .getFromResourceDirAsStream("/zh/tr.ctx");
-      InputStream placeTaggerDctIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/ns.dct");
-      InputStream placeTaggerCtxIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/ns.ctx");
-      InputStream lexTaggerCtxIn = 
JLanguageTool.getDataBroker().getFromResourceDirAsStream(
-          "/zh/lexical.ctx");
+      final ResourceDataBroker dataBroker = JLanguageTool.getDataBroker();
+      final InputStream coreDictIn = 
dataBroker.getFromResourceDirAsStream("/zh/coreDict.dct");
+      final InputStream bigramDictIn = 
dataBroker.getFromResourceDirAsStream("/zh/BigramDict.dct");
+      final InputStream personTaggerDctIn = 
dataBroker.getFromResourceDirAsStream("/zh/nr.dct");
+      final InputStream personTaggerCtxIn = 
dataBroker.getFromResourceDirAsStream("/zh/nr.ctx");
+      final InputStream transPersonTaggerDctIn = 
dataBroker.getFromResourceDirAsStream("/zh/tr.dct");
+      final InputStream transPersonTaggerCtxIn = 
dataBroker.getFromResourceDirAsStream("/zh/tr.ctx");
+      final InputStream placeTaggerDctIn = 
dataBroker.getFromResourceDirAsStream("/zh/ns.dct");
+      final InputStream placeTaggerCtxIn = 
dataBroker.getFromResourceDirAsStream("/zh/ns.ctx");
+      final InputStream lexTaggerCtxIn = 
dataBroker.getFromResourceDirAsStream("/zh/lexical.ctx");
       seg = new SegTag(1, coreDictIn, bigramDictIn, personTaggerDctIn, 
personTaggerCtxIn,
           transPersonTaggerDctIn, transPersonTaggerCtxIn, placeTaggerDctIn, 
placeTaggerCtxIn,
           lexTaggerCtxIn);
@@ -67,8 +60,7 @@
   @Override
   public List<String> tokenize(String text) {
     init();
-    final ArrayList<String> ret = new ArrayList<String>();
-    String result;
+    final String result;
     try {
       result = seg.split(chinesdJF.chineseFan2Jan(text)).getFinalResult();
     } catch (Exception e) {
@@ -76,13 +68,9 @@
       // ArrayIndexOutOfBoundsException, due to some internal bugs of 
ictclas4j. The reasons of the
       // bugs and how to resolve them are unknown now. In this case, we can 
just bypass the sentence
       // and return an empty List.
-      return ret;
+      return new ArrayList<String>();
     }
     final String[] list = result.split(" ");
-
-    for (int i = 0; i < list.length; i++) {
-      ret.add(list[i]);
-    }
-    return ret;
+    return Arrays.asList(list);
   }
 }

This was sent by the SourceForge.net collaborative development platform, the 
world's largest Open Source development site.


------------------------------------------------------------------------------
Live Security Virtual Conference
Exclusive live event will cover all the ways today's security and 
threat landscape has changed and how IT managers can respond. Discussions 
will include endpoint security, mobile security and the latest in malware 
threats. http://www.accelacomm.com/jaw/sfrnl04242012/114/50122263/
_______________________________________________
Languagetool-cvs mailing list
Languagetool-cvs@lists.sourceforge.net
https://lists.sourceforge.net/lists/listinfo/languagetool-cvs

Reply via email to