This is an automated email from the ASF dual-hosted git repository.
rzo1 pushed a commit to branch OPENNLP-1627
in repository https://gitbox.apache.org/repos/asf/opennlp-models.git
The following commit(s) were added to refs/heads/OPENNLP-1627 by this push:
new f25db52 OPENNLP-1627 - Add Croatian models
f25db52 is described below
commit f25db52453a8e0c3b0fa8e4b1c34e4062bc102a3
Author: Richard Zowalla <[email protected]>
AuthorDate: Tue Oct 15 09:48:16 2024 +0200
OPENNLP-1627 - Add Croatian models
---
opennlp-models-pos/opennlp-models-pos-hr/pom.xml | 73 +++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-pos/pom.xml | 1 +
.../opennlp-models-sentdetect-hr/pom.xml | 74 ++++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-sentdetect/pom.xml | 1 +
opennlp-models-test/pom.xml | 15 +++++
.../src/main/resources/expected-models.txt | 9 ++-
.../opennlp-models-tokenizer-hr/pom.xml | 74 ++++++++++++++++++++++
.../src/main/resources/model.properties | 19 ++++++
opennlp-models-tokenizer/pom.xml | 1 +
11 files changed, 302 insertions(+), 3 deletions(-)
diff --git a/opennlp-models-pos/opennlp-models-pos-hr/pom.xml b/opennlp-models-pos/opennlp-models-pos-hr/pom.xml
new file mode 100644
index 0000000..7fadb40
--- /dev/null
+++ b/opennlp-models-pos/opennlp-models-pos-hr/pom.xml
@@ -0,0 +1,73 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-pos</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <name>Apache OpenNLP Models :: Part-Of-Speech :: Croatian</name>
+ <artifactId>opennlp-models-pos-hr</artifactId>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-hr-ud-set-pos-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>8cce65a4343cd82ce03f076ad21143a6245667dabcf69e38af5b5e5652b0e163</model.sha256>
+ <model.language>hr</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-pos/opennlp-models-pos-hr/src/main/resources/model.properties b/opennlp-models-pos/opennlp-models-pos-hr/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-pos/opennlp-models-pos-hr/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-pos/pom.xml b/opennlp-models-pos/pom.xml
index 8c7a595..cd76da6 100644
--- a/opennlp-models-pos/pom.xml
+++ b/opennlp-models-pos/pom.xml
@@ -37,6 +37,7 @@ under the License.
<module>opennlp-models-pos-de</module>
<module>opennlp-models-pos-en</module>
<module>opennlp-models-pos-fr</module>
+ <module>opennlp-models-pos-hr</module>
<module>opennlp-models-pos-it</module>
<module>opennlp-models-pos-nl</module>
</modules>
diff --git a/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/pom.xml b/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/pom.xml
new file mode 100644
index 0000000..1c81b6d
--- /dev/null
+++ b/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/pom.xml
@@ -0,0 +1,74 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-sentdetect</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <artifactId>opennlp-models-sentdetect-hr</artifactId>
+
+ <name>Apache OpenNLP Models :: Sent-Detect :: Croatian</name>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-hr-ud-set-sentence-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>eaba8fa68191189c3e3377c526293d044b2c069415234ab040e628e1d5a926b2</model.sha256>
+ <model.language>hr</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/src/main/resources/model.properties b/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-sentdetect/opennlp-models-sentdetect-hr/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-sentdetect/pom.xml b/opennlp-models-sentdetect/pom.xml
index 43f70f1..67369a8 100644
--- a/opennlp-models-sentdetect/pom.xml
+++ b/opennlp-models-sentdetect/pom.xml
@@ -37,6 +37,7 @@ under the License.
<module>opennlp-models-sentdetect-bg</module>
<module>opennlp-models-sentdetect-cs</module>
<module>opennlp-models-sentdetect-de</module>
+ <module>opennlp-models-sentdetect-hr</module>
<module>opennlp-models-sentdetect-it</module>
<module>opennlp-models-sentdetect-en</module>
<module>opennlp-models-sentdetect-fr</module>
diff --git a/opennlp-models-test/pom.xml b/opennlp-models-test/pom.xml
index d4423ac..5ba6bf1 100644
--- a/opennlp-models-test/pom.xml
+++ b/opennlp-models-test/pom.xml
@@ -52,6 +52,11 @@ under the License.
<artifactId>opennlp-models-sentdetect-en</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-sentdetect-hr</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-sentdetect-it</artifactId>
@@ -87,6 +92,11 @@ under the License.
<artifactId>opennlp-models-tokenizer-en</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-tokenizer-hr</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-tokenizer-it</artifactId>
@@ -122,6 +132,11 @@ under the License.
<artifactId>opennlp-models-pos-en</artifactId>
<version>${project.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-pos-hr</artifactId>
+ <version>${project.version}</version>
+ </dependency>
<dependency>
<groupId>org.apache.opennlp</groupId>
<artifactId>opennlp-models-pos-it</artifactId>
diff --git a/opennlp-models-test/src/main/resources/expected-models.txt b/opennlp-models-test/src/main/resources/expected-models.txt
index be8e69a..eb23f6a 100644
--- a/opennlp-models-test/src/main/resources/expected-models.txt
+++ b/opennlp-models-test/src/main/resources/expected-models.txt
@@ -20,15 +20,17 @@ opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin
opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin
opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin
opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin
-opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin
+opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin
+opennlp-hr-ud-set-sentence-1.1-2.4.0.bin
opennlp-it-ud-vit-sentence-1.1-2.4.0.bin
opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin
# POS
opennlp-bg-ud-btb-pos-1.1-2.4.0.bin
opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin
opennlp-de-ud-gsd-pos-1.1-2.4.0.bin
-opennlp-de-ud-gsd-pos-1.1-2.4.0.bin
-opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin
+opennlp-es-ud-gsd-pos-1.1-2.4.0.bin
+opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin
+opennlp-hr-ud-set-pos-1.1-2.4.0.bin
opennlp-it-ud-vit-pos-1.1-2.4.0.bin
opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin
# Tokens
@@ -37,5 +39,6 @@ opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin
opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin
opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin
opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin
+opennlp-hr-ud-set-tokens-1.1-2.4.0.bin
opennlp-it-ud-vit-tokens-1.1-2.4.0.bin
opennlp-nl-ud-alpino-tokens-1.1-2.4.0.bin
\ No newline at end of file
diff --git a/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/pom.xml b/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/pom.xml
new file mode 100644
index 0000000..a7be66c
--- /dev/null
+++ b/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/pom.xml
@@ -0,0 +1,74 @@
+<?xml version="1.0" encoding="UTF-8"?>
+
+<!--
+Licensed to the Apache Software Foundation (ASF) under one
+or more contributor license agreements. See the NOTICE file
+distributed with this work for additional information
+regarding copyright ownership. The ASF licenses this file
+to you under the Apache License, Version 2.0 (the
+"License"); you may not use this file except in compliance
+with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing,
+software distributed under the License is distributed on an
+"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+KIND, either express or implied. See the License for the
+specific language governing permissions and limitations
+under the License.
+-->
+
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
+ <modelVersion>4.0.0</modelVersion>
+ <parent>
+ <groupId>org.apache.opennlp</groupId>
+ <artifactId>opennlp-models-tokenizer</artifactId>
+ <version>1.1.0-SNAPSHOT</version>
+ </parent>
+
+ <artifactId>opennlp-models-tokenizer-hr</artifactId>
+
+ <name>Apache OpenNLP Models :: Tokenizer :: Croatian</name>
+
+ <properties>
+ <dist.base>${asf.dist.base}</dist.base>
+ <model.family>ud-models-1.1</model.family>
+ <model.name>opennlp-hr-ud-set-tokens-1.1-2.4.0.bin</model.name>
+ <model.version>2.4.0</model.version>
+ <model.sha256>ee76e94fa5b5a218b2e3cb9f781e05cae37cf282d88795358658dafd91408f5d</model.sha256>
+ <model.language>hr</model.language>
+ </properties>
+
+ <build>
+ <resources>
+ <resource>
+ <directory>src/main/resources</directory>
+ <filtering>true</filtering>
+ <includes>
+ <include>**/model.properties</include>
+ </includes>
+ </resource>
+ <resource>
+ <directory>src/main/resources</directory>
+ <includes>
+ <include>**/*.bin</include>
+ </includes>
+ </resource>
+ </resources>
+ <plugins>
+ <plugin>
+ <groupId>com.googlecode.maven-download-plugin</groupId>
+ <artifactId>download-maven-plugin</artifactId>
+ <configuration>
+ <url>${dist.base}/${model.family}/${model.name}</url>
+ </configuration>
+ </plugin>
+ <plugin>
+ <groupId>org.codehaus.mojo</groupId>
+ <artifactId>build-helper-maven-plugin</artifactId>
+ </plugin>
+ </plugins>
+ </build>
+
+</project>
\ No newline at end of file
diff --git a/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/src/main/resources/model.properties b/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/src/main/resources/model.properties
new file mode 100644
index 0000000..2be8681
--- /dev/null
+++ b/opennlp-models-tokenizer/opennlp-models-tokenizer-hr/src/main/resources/model.properties
@@ -0,0 +1,19 @@
+# Licensed to the Apache Software Foundation (ASF) under one or more
+# contributor license agreements. See the NOTICE file distributed with
+# this work for additional information regarding copyright ownership.
+# The ASF licenses this file to You under the Apache License, Version 2.0
+# (the "License"); you may not use this file except in compliance with
+# the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+model.name=${model.name}
+model.version=${model.version}
+model.sha256=${model.sha256}
+model.language=${model.language}
\ No newline at end of file
diff --git a/opennlp-models-tokenizer/pom.xml b/opennlp-models-tokenizer/pom.xml
index 14087f6..bbf1292 100644
--- a/opennlp-models-tokenizer/pom.xml
+++ b/opennlp-models-tokenizer/pom.xml
@@ -39,6 +39,7 @@ under the License.
<module>opennlp-models-tokenizer-de</module>
<module>opennlp-models-tokenizer-en</module>
<module>opennlp-models-tokenizer-fr</module>
+ <module>opennlp-models-tokenizer-hr</module>
<module>opennlp-models-tokenizer-it</module>
<module>opennlp-models-tokenizer-nl</module>
</modules>