ANY23-321 Add openie toggle functionality to service
Project: http://git-wip-us.apache.org/repos/asf/any23/repo Commit: http://git-wip-us.apache.org/repos/asf/any23/commit/63ffc9e3 Tree: http://git-wip-us.apache.org/repos/asf/any23/tree/63ffc9e3 Diff: http://git-wip-us.apache.org/repos/asf/any23/diff/63ffc9e3 Branch: refs/heads/master Commit: 63ffc9e3e8a8da0b4af7ca5b227f1e199e545227 Parents: 4f40fe0 482e780 Author: Lewis John McGibbney <[email protected]> Authored: Fri Feb 2 21:55:12 2018 -0800 Committer: Lewis John McGibbney <[email protected]> Committed: Fri Feb 2 21:55:12 2018 -0800 ---------------------------------------------------------------------- LICENSE-header.txt | 41 -- NOTICE.txt | 2 +- RELEASE-NOTES.txt | 66 ++ api/pom.xml | 2 +- .../main/java/org/apache/any23/vocab/YAML.java | 13 +- .../resources/default-configuration.properties | 4 + cli/pom.xml | 2 +- .../org/apache/any23/cli/SimpleRoverTest.java | 13 +- .../org/apache/any23/cli/YAMLRoverTest.java | 13 +- cli/src/test/resources/log4j.properties | 15 +- core/pom.xml | 6 +- .../extractor/html/EmbeddedJSONLDExtractor.java | 8 +- .../any23/extractor/html/HCardExtractor.java | 3 +- .../any23/extractor/html/HTMLMetaExtractor.java | 6 +- .../apache/any23/extractor/html/JsoupUtils.java | 103 ++++ .../any23/extractor/html/TagSoupParser.java | 172 +++--- .../html/TagSoupParsingConfiguration.java | 181 ++++++ .../any23/extractor/rdf/BaseRDFExtractor.java | 46 +- .../html/EmbeddedJSONLDExtractorTest.java | 14 + .../microdata/MicrodataParserTest.java | 5 +- .../extractor/rdfa/RDFa11ExtractorTest.java | 41 +- csvutils/pom.xml | 2 +- encoding/pom.xml | 2 +- mime/pom.xml | 2 +- plugins/basic-crawler/pom.xml | 10 +- plugins/html-scraper/pom.xml | 4 +- plugins/integration-test/pom.xml | 2 +- plugins/office-scraper/pom.xml | 4 +- plugins/openie/pom.xml | 2 +- pom.xml | 14 +- service/pom.xml | 2 +- .../main/assembly/NOTICE-server-embedded.txt | 2 +- service/src/main/assembly/NOTICE-with-deps.txt | 2 +- .../src/main/assembly/NOTICE-without-deps.txt | 2 +- test-resources/pom.xml | 2 +- .../html-body-embedded-jsonld-extractor.html | 37 ++ ...head-and-body-embedded-jsonld-extractor.html | 47 ++ .../test/resources/html/rdfa/rdfa-issue227.html | 40 ++ .../html/rdfa/rdfa-issue268-and-317.html | 613 +++++++++++++++++++ .../html/rdfa/rdfa-issue271-and-317.html | 251 ++++++++ .../html/rdfa/rdfa-issue273-and-317.html | 143 +++++ .../html/rdfa/rdfa-issue326-and-267.html | 20 + 42 files changed, 1777 insertions(+), 182 deletions(-) ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/any23/blob/63ffc9e3/plugins/integration-test/pom.xml ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/any23/blob/63ffc9e3/plugins/openie/pom.xml ---------------------------------------------------------------------- diff --cc plugins/openie/pom.xml index 64c6806,0000000..0f34ad5 mode 100644,000000..100644 --- a/plugins/openie/pom.xml +++ b/plugins/openie/pom.xml @@@ -1,165 -1,0 +1,165 @@@ +<?xml version="1.0" encoding="UTF-8"?> +<!-- + Licensed to the Apache Software Foundation (ASF) under one or more + contributor license agreements. See the NOTICE file distributed with + this work for additional information regarding copyright ownership. + The ASF licenses this file to You under the Apache License, Version 2.0 + (the "License"); you may not use this file except in compliance with + the License. You may obtain a copy of the License at + + http://www.apache.org/licenses/LICENSE-2.0 + + Unless required by applicable law or agreed to in writing, software + distributed under the License is distributed on an "AS IS" BASIS, + WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + See the License for the specific language governing permissions and + limitations under the License. +--> +<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd"> + <modelVersion>4.0.0</modelVersion> + + <parent> + <groupId>org.apache.any23</groupId> + <artifactId>apache-any23</artifactId> - <version>2.2-SNAPSHOT</version> ++ <version>2.3-SNAPSHOT</version> + <relativePath>../../pom.xml</relativePath> + </parent> + + <groupId>org.apache.any23.plugins</groupId> + <artifactId>apache-any23-openie</artifactId> + + <name>Apache Any23 :: Plugins :: OpenIE</name> + <description>Open Information Extraction module.</description> + + <repositories> + <repository> + <snapshots> + <enabled>false</enabled> + </snapshots> + <id>bintray-allenai-maven</id> + <name>bintray</name> + <url>http://allenai.bintray.com/maven</url> + </repository> + </repositories> + <pluginRepositories> + <pluginRepository> + <snapshots> + <enabled>false</enabled> + </snapshots> + <id>bintray-allenai-maven</id> + <name>bintray-plugins</name> + <url>http://allenai.bintray.com/maven</url> + </pluginRepository> + </pluginRepositories> + + <dependencies> + <dependency> + <groupId>org.apache.any23</groupId> + <artifactId>apache-any23-core</artifactId> + <version>${project.version}</version> + <scope>provided</scope> + </dependency> + <dependency> + <groupId>org.apache.any23</groupId> + <artifactId>apache-any23-test-resources</artifactId> + <version>${project.version}</version> + <scope>test</scope> + <type>test-jar</type> + </dependency> + <dependency> + <groupId>org.allenai.openie</groupId> + <artifactId>openie_2.11</artifactId> + <version>${openie_2.11.version}</version> + <scope>compile</scope> + </dependency> + <dependency> + <groupId>org.allenai.openie</groupId> + <artifactId>openie_2.11</artifactId> + <version>${openie_2.11.version}</version> + <scope>compile</scope> + <type>pom</type> + </dependency> + <dependency> + <groupId>edu.washington.cs.knowitall</groupId> + <artifactId>openregex</artifactId> + <version>${openregex.version}</version> + <scope>runtime</scope> + </dependency> + <dependency> + <groupId>junit</groupId> + <artifactId>junit</artifactId> + <scope>test</scope> + </dependency> + <dependency> + <groupId>org.slf4j</groupId> + <artifactId>slf4j-log4j12</artifactId> + <scope>test</scope> + </dependency> + </dependencies> + + <build> + <plugins> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-surefire-plugin</artifactId> + <configuration> + <skipTests>true</skipTests> + </configuration> + </plugin> + <!-- Generates the distribution package --> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-assembly-plugin</artifactId> + <configuration> + <appendAssemblyId>false</appendAssemblyId> + <descriptors> + <descriptor>${basedir}/src/main/assembly/bin.xml</descriptor> + </descriptors> + </configuration> + </plugin> + </plugins> + <pluginManagement> + <plugins> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-assembly-plugin</artifactId> + <version>${maven-assembly-plugin.version}</version> + <executions> + <execution> + <id>assembly</id> + <phase>package</phase> + <goals> + <goal>single</goal> + </goals> + </execution> + </executions> + <configuration> + <attach>true</attach> + <skipAssembly>true</skipAssembly> + <tarLongFileMode>gnu</tarLongFileMode> + </configuration> + </plugin> + </plugins> + </pluginManagement> + </build> + + <profiles> + <profile> + <id>release</id> + <build> + <resources> + <resource> + <directory>${basedir}/../</directory> + <targetPath>${project.build.directory}/apidocs/META-INF</targetPath> + <includes> + <include>LICENSE.txt</include> + <include>NOTICE.txt</include> + </includes> + </resource> + </resources> + </build> + </profile> + + </profiles> + +</project> http://git-wip-us.apache.org/repos/asf/any23/blob/63ffc9e3/pom.xml ---------------------------------------------------------------------- http://git-wip-us.apache.org/repos/asf/any23/blob/63ffc9e3/service/pom.xml ----------------------------------------------------------------------
