This is an automated email from the ASF dual-hosted git repository.
rzo1 pushed a commit to branch OPENNLP-1627
in repository https://gitbox.apache.org/repos/asf/opennlp-models.git
The following commit(s) were added to refs/heads/OPENNLP-1627 by this push:
new 5c0fc3f OPENNLP-1627 - Add Czech models
5c0fc3f is described below
commit 5c0fc3fc7951380a267a2c07def182fdccc04278
Author: Richard Zowalla <[email protected]>
AuthorDate: Tue Oct 15 09:40:06 2024 +0200
OPENNLP-1627 - Add Czech models
---
opennlp-models-pos/opennlp-models-pos-cs/pom.xml | 73 +++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-pos/pom.xml | 1 +
.../opennlp-models-sentdetect-cs/pom.xml | 74 ++++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-sentdetect/pom.xml | 1 +
opennlp-models-test/pom.xml | 15 +++++
.../src/main/resources/expected-models.txt | 3 +
.../opennlp-models-tokenizer-cs/pom.xml | 74 ++++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-tokenizer/pom.xml | 1 +
11 files changed, 299 insertions(+)
diff --git a/opennlp-models-pos/opennlp-models-pos-cs/pom.xml b/opennlp-models-pos/opennlp-models-pos-cs/pom.xml
new file mode 100644
index 0000000..5bc5634
--- /dev/null
+++ b/opennlp-models-pos/opennlp-models-pos-cs/pom.xml
@@ -0,0 +1,73 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-pos</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <name>Apache OpenNLP Models :: Part-Of-Speech :: Czech</name>
+ <artifactId>opennlp-models-pos-cs</artifactId>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>02e15f3ee385e2da83eab7582aa3a5076a91889d51dcb33e773f3ecbd24a9cf0</model.sha256>
+ <model.language>cs</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-pos/opennlp-models-pos-cs/src/main/resources/model.properties b/opennlp-models-pos/opennlp-models-pos-cs/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-pos/opennlp-models-pos-cs/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-pos/pom.xml b/opennlp-models-pos/pom.xml
index adb586e..8c7a595 100644
--- a/opennlp-models-pos/pom.xml
+++ b/opennlp-models-pos/pom.xml
@@ -33,6 +33,7 @@ under the License.
<modules>
<module>opennlp-models-pos-bg</module>
+ <module>opennlp-models-pos-cs</module>
<module>opennlp-models-pos-de</module>
<module>opennlp-models-pos-en</module>
<module>opennlp-models-pos-fr</module>
diff --git a/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/pom.xml b/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/pom.xml
new file mode 100644
index 0000000..9cb7301
--- /dev/null
+++ b/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/pom.xml
@@ -0,0 +1,74 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-sentdetect</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <artifactId>opennlp-models-sentdetect-cs</artifactId>
+
+ <name>Apache OpenNLP Models :: Sent-Detect :: Czech</name>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>f286a44a465d2d38ae7e0b0c67e239cbc1fad24e29f27f2b8be3ccd6c2853ae3</model.sha256>
+ <model.language>cs</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/src/main/resources/model.properties b/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-sentdetect/opennlp-models-sentdetect-cs/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-sentdetect/pom.xml b/opennlp-models-sentdetect/pom.xml
index 1f6bd5d..43f70f1 100644
--- a/opennlp-models-sentdetect/pom.xml
+++ b/opennlp-models-sentdetect/pom.xml
@@ -35,6 +35,7 @@ under the License.
<modules>
<module>opennlp-models-sentdetect-bg</module>
+ <module>opennlp-models-sentdetect-cs</module>
<module>opennlp-models-sentdetect-de</module>
<module>opennlp-models-sentdetect-it</module>
<module>opennlp-models-sentdetect-en</module>
diff --git a/opennlp-models-test/pom.xml b/opennlp-models-test/pom.xml
index c85117e..d4423ac 100644
--- a/opennlp-models-test/pom.xml
+++ b/opennlp-models-test/pom.xml
@@ -37,6 +37,11 @@ under the License.
<artifactId>opennlp-models-sentdetect-bg</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-sentdetect-cs</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-sentdetect-de</artifactId>
@@ -67,6 +72,11 @@ under the License.
<artifactId>opennlp-models-tokenizer-bg</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-tokenizer-cs</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-tokenizer-de</artifactId>
@@ -97,6 +107,11 @@ under the License.
<artifactId>opennlp-models-pos-bg</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-pos-cs</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-pos-de</artifactId>
diff --git a/opennlp-models-test/src/main/resources/expected-models.txt b/opennlp-models-test/src/main/resources/expected-models.txt
index 228e4ac..be8e69a 100644
--- a/opennlp-models-test/src/main/resources/expected-models.txt
+++ b/opennlp-models-test/src/main/resources/expected-models.txt
@@ -17,6 +17,7 @@
langdetect-183.bin
# Sentence Detection
opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin
+opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin
opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin
opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin
opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin
@@ -24,6 +25,7 @@ opennlp-it-ud-vit-sentence-1.1-2.4.0.bin
opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin
# POS
opennlp-bg-ud-btb-pos-1.1-2.4.0.bin
+opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin
opennlp-de-ud-gsd-pos-1.1-2.4.0.bin
opennlp-de-ud-gsd-pos-1.1-2.4.0.bin
opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin
@@ -31,6 +33,7 @@ opennlp-it-ud-vit-pos-1.1-2.4.0.bin
opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin
# Tokens
opennlp-bg-ud-btb-tokens-1.1-2.4.0.bin
+opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin
opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin
opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin
opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin
diff --git a/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/pom.xml b/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/pom.xml
new file mode 100644
index 0000000..7642f12
--- /dev/null
+++ b/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/pom.xml
@@ -0,0 +1,74 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-tokenizer</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <artifactId>opennlp-models-tokenizer-cs</artifactId>
+
+ <name>Apache OpenNLP Models :: Tokenizer :: Czech</name>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>5028cf16f7cb6adeab07ffbb2873923cce6c6002a98f6df033afd8852efdd450</model.sha256>
+ <model.language>cs</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/src/main/resources/model.properties b/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-tokenizer/opennlp-models-tokenizer-cs/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-tokenizer/pom.xml b/opennlp-models-tokenizer/pom.xml
index e2c65e7..14087f6 100644
--- a/opennlp-models-tokenizer/pom.xml
+++ b/opennlp-models-tokenizer/pom.xml
@@ -35,6 +35,7 @@ under the License.
<modules>
<module>opennlp-models-tokenizer-bg</module>
+ <module>opennlp-models-tokenizer-cs</module>
<module>opennlp-models-tokenizer-de</module>
<module>opennlp-models-tokenizer-en</module>
<module>opennlp-models-tokenizer-fr</module>