Author: rmuir
Date: Wed Mar 17 05:38:14 2010
New Revision: 924164
URL: http://svn.apache.org/viewvc?rev=924164&view=rev
Log:
generate analysis factories for trunk's new lang support
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java
(with props)
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java
(with props)
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java
(with props)
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java
(with props)
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java
(with props)
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java
(with props)
Modified:
lucene/solr/branches/solr/lib/lucene-analyzers-3.1-dev.jar
Modified: lucene/solr/branches/solr/lib/lucene-analyzers-3.1-dev.jar
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/lib/lucene-analyzers-3.1-dev.jar?rev=924164&r1=924163&r2=924164&view=diff
==============================================================================
Binary files - no diff available.
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.bg.BulgarianStemFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link BulgarianStemFilter}. */
+public class BulgarianStemFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new BulgarianStemFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/BulgarianStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.cz.CzechStemFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link CzechStemFilter}. */
+public class CzechStemFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new CzechStemFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/CzechStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.hi.HindiNormalizationFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link HindiNormalizationFilter}. */
+public class HindiNormalizationFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new HindiNormalizationFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiNormalizationFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.hi.HindiStemFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link HindiStemFilter}. */
+public class HindiStemFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new HindiStemFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/HindiStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.in.IndicNormalizationFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link IndicNormalizationFilter}. */
+public class IndicNormalizationFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new IndicNormalizationFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicNormalizationFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,31 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.in.IndicTokenizer;
+
+/** Factory whose {@link #create} builds an {@link IndicTokenizer} over the given Reader, passing luceneMatchVersion. */
+public class IndicTokenizerFactory extends BaseTokenizerFactory {
+ public Tokenizer create(Reader input) {
+ assureMatchVersion(); // NOTE(review): presumably rejects an unset luceneMatchVersion - confirm in BaseTokenizerFactory
+ return new IndicTokenizer(luceneMatchVersion, input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/IndicTokenizerFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,28 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.tr.TurkishLowerCaseFilter;
+
+/** Factory whose {@link #create} wraps the given TokenStream in a new {@link TurkishLowerCaseFilter}. */
+public class TurkishLowerCaseFilterFactory extends BaseTokenFilterFactory {
+ public TokenStream create(TokenStream input) {
+ return new TurkishLowerCaseFilter(input);
+ }
+}
Propchange:
lucene/solr/branches/solr/src/java/org/apache/solr/analysis/TurkishLowerCaseFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,41 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.WhitespaceTokenizer;
+
+/**
+ * Simple test that BulgarianStemFilterFactory creates a filter that stems its input tokens.
+ */
+public class TestBulgarianStemFilterFactory extends BaseTokenTestCase {
+ /**
+ * Runs one whitespace-tokenized Bulgarian word through the factory's filter and expects its stem.
+ */
+ public void testStemming() throws Exception {
+ Reader reader = new StringReader("компютри");
+ Tokenizer tokenizer = new WhitespaceTokenizer(reader);
+ BulgarianStemFilterFactory factory = new BulgarianStemFilterFactory();
+ TokenStream stream = factory.create(tokenizer);
+ assertTokenStreamContents(stream, new String[] { "компютр" });
+ }
+}
Propchange:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestBulgarianStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,41 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.WhitespaceTokenizer;
+
+/**
+ * Simple test that CzechStemFilterFactory creates a filter that stems its input tokens.
+ */
+public class TestCzechStemFilterFactory extends BaseTokenTestCase {
+ /**
+ * Runs one whitespace-tokenized Czech word through the factory's filter and expects its stem.
+ */
+ public void testStemming() throws Exception {
+ Reader reader = new StringReader("angličtí");
+ Tokenizer tokenizer = new WhitespaceTokenizer(reader);
+ CzechStemFilterFactory factory = new CzechStemFilterFactory();
+ TokenStream stream = factory.create(tokenizer);
+ assertTokenStreamContents(stream, new String[] { "anglick" });
+ }
+}
Propchange:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestCzechStemFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java
(added)
+++
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,89 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+
+/**
+ * Simple tests to ensure the Indic tokenizer and the Indic/Hindi filter factories are working.
+ */
+public class TestHindiFilters extends BaseTokenTestCase {
+ /**
+ * Test IndicTokenizerFactory: a Hindi sentence is split into words and the trailing danda is not a token.
+ */
+ public void testTokenizer() throws Exception {
+ Reader reader = new StringReader("मुझे हिंदी का और अभ्यास करना होगा ।");
+ IndicTokenizerFactory factory = new IndicTokenizerFactory();
+ factory.init(DEFAULT_VERSION_PARAM);
+ Tokenizer stream = factory.create(reader);
+ assertTokenStreamContents(stream,
+ new String[] { "मुझे", "हिंदी", "का", "और", "अभ्यास", "करना", "होगा" });
+ }
+
+ /**
+ * Test IndicNormalizationFilterFactory (escapes keep the ZWJ and the decomposed vowel signs unambiguous)
+ */
+ public void testIndicNormalizer() throws Exception {
+ Reader reader = new StringReader("\u09A4\u09CD\u200D \u0905\u093E\u0948\u0930"); // TA+VIRAMA+ZWJ, then A+AA+AI+RA
+ IndicTokenizerFactory factory = new IndicTokenizerFactory();
+ IndicNormalizationFilterFactory filterFactory = new IndicNormalizationFilterFactory();
+ factory.init(DEFAULT_VERSION_PARAM);
+ filterFactory.init(DEFAULT_VERSION_PARAM);
+ Tokenizer tokenizer = factory.create(reader);
+ TokenStream stream = filterFactory.create(tokenizer);
+ assertTokenStreamContents(stream, new String[] { "ৎ", "और" });
+ }
+
+ /**
+ * Test HindiNormalizationFilterFactory, chained after the Indic normalizer
+ */
+ public void testHindiNormalizer() throws Exception {
+ Reader reader = new StringReader("\u0958िताब"); // U+0958 is the precomposed letter QA
+ IndicTokenizerFactory factory = new IndicTokenizerFactory();
+ IndicNormalizationFilterFactory indicFilterFactory = new IndicNormalizationFilterFactory();
+ HindiNormalizationFilterFactory hindiFilterFactory = new HindiNormalizationFilterFactory();
+ factory.init(DEFAULT_VERSION_PARAM);
+ hindiFilterFactory.init(DEFAULT_VERSION_PARAM);
+ Tokenizer tokenizer = factory.create(reader);
+ TokenStream stream = indicFilterFactory.create(tokenizer);
+ stream = hindiFilterFactory.create(stream);
+ assertTokenStreamContents(stream, new String[] {"किताब"});
+ }
+
+ /**
+ * Test HindiStemFilterFactory, chained after the Indic and Hindi normalizers
+ */
+ public void testStemmer() throws Exception {
+ Reader reader = new StringReader("किताबें");
+ IndicTokenizerFactory factory = new IndicTokenizerFactory();
+ IndicNormalizationFilterFactory indicFilterFactory = new IndicNormalizationFilterFactory();
+ HindiNormalizationFilterFactory hindiFilterFactory = new HindiNormalizationFilterFactory();
+ HindiStemFilterFactory stemFactory = new HindiStemFilterFactory();
+ factory.init(DEFAULT_VERSION_PARAM);
+ stemFactory.init(DEFAULT_VERSION_PARAM);
+ Tokenizer tokenizer = factory.create(reader);
+ TokenStream stream = indicFilterFactory.create(tokenizer);
+ stream = hindiFilterFactory.create(stream);
+ stream = stemFactory.create(stream);
+ assertTokenStreamContents(stream, new String[] {"किताब"});
+ }
+}
Propchange:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestHindiFilters.java
------------------------------------------------------------------------------
svn:eol-style = native
Added:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java
URL:
http://svn.apache.org/viewvc/lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java?rev=924164&view=auto
==============================================================================
---
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java
(added)
+++
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java
Wed Mar 17 05:38:14 2010
@@ -0,0 +1,41 @@
+package org.apache.solr.analysis;
+
+/**
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+import java.io.Reader;
+import java.io.StringReader;
+
+import org.apache.lucene.analysis.TokenStream;
+import org.apache.lucene.analysis.Tokenizer;
+import org.apache.lucene.analysis.WhitespaceTokenizer;
+
+/**
+ * Simple test that TurkishLowerCaseFilterFactory creates a filter that lowercases its input tokens.
+ */
+public class TestTurkishLowerCaseFilterFactory extends BaseTokenTestCase {
+ /**
+ * Runs an upper-case Turkish word through the factory's filter; "I" must become dotless "ı".
+ */
+ public void testCasing() throws Exception {
+ Reader reader = new StringReader("AĞACI");
+ Tokenizer tokenizer = new WhitespaceTokenizer(reader);
+ TurkishLowerCaseFilterFactory factory = new TurkishLowerCaseFilterFactory();
+ TokenStream stream = factory.create(tokenizer);
+ assertTokenStreamContents(stream, new String[] { "ağacı" });
+ }
+}
Propchange:
lucene/solr/branches/solr/src/test/org/apache/solr/analysis/TestTurkishLowerCaseFilterFactory.java
------------------------------------------------------------------------------
svn:eol-style = native