This is an automated email from the ASF dual-hosted git repository. mawiesne pushed a commit to branch modernize_dependencies_of_opennlp-similarity_component in repository https://gitbox.apache.org/repos/asf/opennlp-sandbox.git
commit a2dbd405b27bc1d0e3c87ed8d5339d0ff7391179 Author: Martin Wiesner <[email protected]> AuthorDate: Sun Feb 12 13:20:42 2023 +0100 modernizes dependencies of opennlp-similarity component - updates several 3rd party dependencies to more recent, conflict free versions - adds missing license headers in `review_builder` package --- opennlp-similarity/pom.xml | 30 +-- .../review_builder/FBOpenGraphSearchManager.java | 24 +- .../review_builder/MachineTranslationWrapper.java | 20 +- .../review_builder/MinedSentenceProcessor.java | 5 +- .../tools/apps/review_builder/ParserConstants.java | 149 ++++++------ .../apps/review_builder/ReviewBuilderRunner.java | 251 +++++++++++---------- .../tools/apps/review_builder/ReviewObj.java | 17 ++ .../review_builder/SentenceBeingOriginalized.java | 19 +- .../apps/review_builder/SentenceOriginalizer.java | 17 ++ .../URLsWithReviewFinderByProductName.java | 19 +- .../review_builder/WebPageReviewExtractor.java | 17 ++ 11 files changed, 358 insertions(+), 210 deletions(-) diff --git a/opennlp-similarity/pom.xml b/opennlp-similarity/pom.xml index 7bc3105..5e2db8d 100644 --- a/opennlp-similarity/pom.xml +++ b/opennlp-similarity/pom.xml @@ -90,12 +90,7 @@ <artifactId>opennlp-tools</artifactId> <version>2.1.0</version> </dependency> - - <dependency> - <groupId>org.slf4j</groupId> - <artifactId>slf4j-log4j12</artifactId> - <version>1.7.33</version> - </dependency> + <dependency> <groupId>org.junit.jupiter</groupId> <artifactId>junit-jupiter-api</artifactId> @@ -123,17 +118,17 @@ <dependency> <groupId>org.json</groupId> <artifactId>json</artifactId> - <version>20090211</version> + <version>20220924</version> </dependency> <dependency> <groupId>org.apache.tika</groupId> <artifactId>tika-app</artifactId> - <version>2.6.0</version> + <version>2.7.0</version> </dependency> <dependency> <groupId>net.sf.opencsv</groupId> <artifactId>opencsv</artifactId> - <version>2.0</version> + <version>2.3</version> </dependency> <dependency> @@ -144,7 +139,7 @@ <dependency> <groupId>commons-codec</groupId> <artifactId>commons-codec</artifactId> - <version>1.13</version> + <version>1.15</version> </dependency> <dependency> <groupId>commons-logging</groupId> @@ -191,7 +186,7 @@ <dependency> <groupId>de.jollyday</groupId> <artifactId>jollyday</artifactId> - <version>0.4.7</version> + <version>0.5.10</version> </dependency> <dependency> <groupId>jgraph</groupId> @@ -206,7 +201,7 @@ <dependency> <groupId>com.restfb</groupId> <artifactId>restfb</artifactId> - <version>1.6.12</version> + <version>1.49.0</version> </dependency> <dependency> <groupId>com.memetix</groupId> @@ -225,6 +220,14 @@ <artifactId>jverbnet</artifactId> <version>1.2.0.1</version> <exclusions> + <exclusion> + <groupId>ch.qos.logback</groupId> + <artifactId>logback-core</artifactId> + </exclusion> + <exclusion> + <groupId>ch.qos.logback</groupId> + <artifactId>logback-classic</artifactId> + </exclusion> <!-- Avoids problems with conflicting slf4j bindings at runtime --> <exclusion> <groupId>org.slf4j</groupId> @@ -236,8 +239,9 @@ <dependency> <groupId>org.docx4j</groupId> <artifactId>docx4j</artifactId> - <version>2.7.1</version> + <version>3.3.7</version> </dependency> + <dependency> <groupId>org.deeplearning4j</groupId> <artifactId>deeplearning4j-core</artifactId> diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/FBOpenGraphSearchManager.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/FBOpenGraphSearchManager.java index 4d6e0dd..c81cad8 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/FBOpenGraphSearchManager.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/FBOpenGraphSearchManager.java @@ -1,12 +1,25 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.ArrayList; -import java.util.Calendar; import java.util.List; -import org.apache.commons.lang.StringUtils; -import opennlp.tools.jsmlearning.ProfileReaderWriter; -import opennlp.tools.similarity.apps.utils.PageFetcher; import com.restfb.Connection; import com.restfb.DefaultFacebookClient; import com.restfb.FacebookClient; @@ -14,7 +27,10 @@ import com.restfb.Parameter; import com.restfb.exception.FacebookException; import com.restfb.types.Event; import com.restfb.types.Page; +import org.apache.commons.lang.StringUtils; +import opennlp.tools.jsmlearning.ProfileReaderWriter; +import opennlp.tools.similarity.apps.utils.PageFetcher; public class FBOpenGraphSearchManager { diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MachineTranslationWrapper.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MachineTranslationWrapper.java index 30ed7e3..1da0423 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MachineTranslationWrapper.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MachineTranslationWrapper.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.io.BufferedReader; @@ -7,10 +24,7 @@ import java.net.MalformedURLException; import java.net.URL; import java.net.URLConnection; import java.net.URLDecoder; -import java.util.HashMap; -import java.util.Map; -import org.apache.commons.lang.StringUtils; import org.json.JSONArray; import org.json.JSONException; import org.json.JSONObject; diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java index b0f0362..cad691a 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java @@ -17,13 +17,10 @@ package opennlp.tools.apps.review_builder; -import java.util.Arrays; -import java.util.List; +import org.apache.commons.lang.StringUtils; import opennlp.tools.similarity.apps.utils.Utils; -import org.apache.commons.lang.StringUtils; - public class MinedSentenceProcessor { public static String acceptableMinedSentence(String sent) { // if too many commas => seo text diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ParserConstants.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ParserConstants.java index 9862ffb..6ee255a 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ParserConstants.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ParserConstants.java @@ -1,74 +1,91 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; public interface ParserConstants { // added new POS types for infinitive phrase and participle phrase - public static final String TYPE_STP = "STP"; // infinitive phrase - public static final String TYPE_SGP = "SGP"; // present participle phrase - public static final String TYPE_SNP = "SNP"; // past participle phrase + String TYPE_STP = "STP"; // infinitive phrase + String TYPE_SGP = "SGP"; // present participle phrase + String TYPE_SNP = "SNP"; // past participle phrase // below are the standard POS types, // http://bulba.sdsu.edu/jeanette/thesis/PennTags.html - public static final String TYPE_ADJP = "ADJP"; - public static final String TYPE_ADVP = "ADVP"; - public static final String TYPE_CC = "CC"; - public static final String TYPE_CD = "CD"; - public static final String TYPE_CONJP = "CONJP"; - public static final String TYPE_DT = "DT"; - public static final String TYPE_EX = "EX"; - public static final String TYPE_FRAG = "FRAG"; - public static final String TYPE_FW = "FW"; - public static final String TYPE_IN = "IN"; - public static final String TYPE_INTJ = "INTJ"; - public static final String TYPE_JJ = "JJ"; - public static final String TYPE_JJR = "JJR"; - public static final String TYPE_JJS = "JJS"; - public static final String TYPE_LS = "LS"; - public static final String TYPE_LST = "LST"; - public static final String TYPE_MD = "MD"; - public static final String TYPE_NAC = "NAC"; - public static final String TYPE_NN = "NN"; - public static final String TYPE_NNS = "NNS"; - public static final String TYPE_NNP = "NNP"; - public static final String TYPE_NNPS = "NNPS"; - public static final String TYPE_NP = "NP"; - public static final String TYPE_NX = "NX"; - public static final String TYPE_PDT = "PDT"; - public static final String TYPE_POS = "POS"; - public static final String TYPE_PP = "PP"; - public static final String TYPE_PRN = "PRN"; - public static final String TYPE_PRP = "PRP"; - public static final String TYPE_PRP$ = "PRP$"; - public static final String TYPE_PRT = "PRT"; - public static final String TYPE_QP = "QP"; - public static final String TYPE_RB = "RB"; - public static final String TYPE_RBR = "RBR"; - public static final String TYPE_RBS = "RBS"; - public static final String TYPE_RP = "RP"; - public static final String TYPE_RRC = "RRC"; - public static final String TYPE_S = "S"; - public static final String TYPE_SBAR = "SBAR"; - public static final String TYPE_SBARQ = "SBARQ"; - public static final String TYPE_SINV = "SINV"; - public static final String TYPE_SQ = "SQ"; - public static final String TYPE_SYM = "SYM"; - public static final String TYPE_TO = "TO"; - public static final String TYPE_TOP = "TOP"; - public static final String TYPE_UCP = "UCP"; - public static final String TYPE_UH = "UH"; - public static final String TYPE_VB = "VB"; - public static final String TYPE_VBD = "VBD"; - public static final String TYPE_VBG = "VBG"; - public static final String TYPE_VBN = "VBN"; - public static final String TYPE_VBP = "VBP"; - public static final String TYPE_VBZ = "VBZ"; - public static final String TYPE_VP = "VP"; - public static final String TYPE_WDT = "WDT"; - public static final String TYPE_WHADJP = "WHADJP"; - public static final String TYPE_WHADVP = "WHADVP"; - public static final String TYPE_WHNP = "WHNP"; - public static final String TYPE_WHPP = "WHPP"; - public static final String TYPE_WP = "WP"; - public static final String TYPE_WP$ = "WP$"; - public static final String TYPE_WRB = "WRB"; - public static final String TYPE_X = "X"; + String TYPE_ADJP = "ADJP"; + String TYPE_ADVP = "ADVP"; + String TYPE_CC = "CC"; + String TYPE_CD = "CD"; + String TYPE_CONJP = "CONJP"; + String TYPE_DT = "DT"; + String TYPE_EX = "EX"; + String TYPE_FRAG = "FRAG"; + String TYPE_FW = "FW"; + String TYPE_IN = "IN"; + String TYPE_INTJ = "INTJ"; + String TYPE_JJ = "JJ"; + String TYPE_JJR = "JJR"; + String TYPE_JJS = "JJS"; + String TYPE_LS = "LS"; + String TYPE_LST = "LST"; + String TYPE_MD = "MD"; + String TYPE_NAC = "NAC"; + String TYPE_NN = "NN"; + String TYPE_NNS = "NNS"; + String TYPE_NNP = "NNP"; + String TYPE_NNPS = "NNPS"; + String TYPE_NP = "NP"; + String TYPE_NX = "NX"; + String TYPE_PDT = "PDT"; + String TYPE_POS = "POS"; + String TYPE_PP = "PP"; + String TYPE_PRN = "PRN"; + String TYPE_PRP = "PRP"; + String TYPE_PRP$ = "PRP$"; + String TYPE_PRT = "PRT"; + String TYPE_QP = "QP"; + String TYPE_RB = "RB"; + String TYPE_RBR = "RBR"; + String TYPE_RBS = "RBS"; + String TYPE_RP = "RP"; + String TYPE_RRC = "RRC"; + String TYPE_S = "S"; + String TYPE_SBAR = "SBAR"; + String TYPE_SBARQ = "SBARQ"; + String TYPE_SINV = "SINV"; + String TYPE_SQ = "SQ"; + String TYPE_SYM = "SYM"; + String TYPE_TO = "TO"; + String TYPE_TOP = "TOP"; + String TYPE_UCP = "UCP"; + String TYPE_UH = "UH"; + String TYPE_VB = "VB"; + String TYPE_VBD = "VBD"; + String TYPE_VBG = "VBG"; + String TYPE_VBN = "VBN"; + String TYPE_VBP = "VBP"; + String TYPE_VBZ = "VBZ"; + String TYPE_VP = "VP"; + String TYPE_WDT = "WDT"; + String TYPE_WHADJP = "WHADJP"; + String TYPE_WHADVP = "WHADVP"; + String TYPE_WHNP = "WHNP"; + String TYPE_WHPP = "WHPP"; + String TYPE_WP = "WP"; + String TYPE_WP$ = "WP$"; + String TYPE_WRB = "WRB"; + String TYPE_X = "X"; } diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewBuilderRunner.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewBuilderRunner.java index f8dfaa8..6a11ad7 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewBuilderRunner.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewBuilderRunner.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.ArrayList; @@ -8,65 +25,65 @@ import opennlp.tools.parse_thicket.Triple; public class ReviewBuilderRunner { - private List<Triple> input = new ArrayList<Triple>(); + private final List<Triple> input = new ArrayList<>(); public ReviewBuilderRunner(){ /* input.add( new Pair<String, Integer>("chief architect portable mobile tv", 204973051)); - input.add( new Pair<String, Integer>("lg plasma tv", 215734562)); - input.add( new Pair<String, Integer>("magnavox lcd hdtv", 215415652)); - input.add( new Pair<String, Integer>("yamaha aventage home theater receiver", 215742271)); - input.add( new Pair<String, Integer>("panasonic 24inch lcd tv", 215742233)); - input.add( new Pair<String, Integer>("otterbox barnes and noble nook commuter case", 215572161)); - input.add( new Pair<String, Integer>("sony kdl32ex340 led tv", 215743925)); - input.add( new Pair<String, Integer>("alpine waterfall tabletop fountain lighting", 215135546)); - input.add( new Pair<String, Integer>("ihome rechargeable speaker system", 215363231 )); - input.add( new Pair<String, Integer>("ion slide film scanner", 212088884)); - - input.add( new Pair<String, Integer>("mens dr martens shoes black nappa", 210813142)); - input.add( new Pair<String, Integer>("calvin klein seamless thong panty", 201984853)); - input.add( new Pair<String, Integer>("mens clarks shoes wallabee beeswax leather", 210808477)); + input.add( new Pair<String, Integer>("lg plasma tv", 215734562)); + input.add( new Pair<String, Integer>("magnavox lcd hdtv", 215415652)); + input.add( new Pair<String, Integer>("yamaha aventage home theater receiver", 215742271)); + input.add( new Pair<String, Integer>("panasonic 24inch lcd tv", 215742233)); + input.add( new Pair<String, Integer>("otterbox barnes and noble nook commuter case", 215572161)); + input.add( new Pair<String, Integer>("sony kdl32ex340 led tv", 215743925)); + input.add( new Pair<String, Integer>("alpine waterfall tabletop fountain lighting", 215135546)); + input.add( new Pair<String, Integer>("ihome rechargeable speaker system", 215363231 )); + input.add( new Pair<String, Integer>("ion slide film scanner", 212088884)); + + input.add( new Pair<String, Integer>("mens dr martens shoes black nappa", 210813142)); + input.add( new Pair<String, Integer>("calvin klein seamless thong panty", 201984853)); + input.add( new Pair<String, Integer>("mens clarks shoes wallabee beeswax leather", 210808477)); //? input.add( new Pair<String, Integer>("mens sperry topsider shoes", 210809238)); - input.add( new Pair<String, Integer>("mens giorgio brutini shoes italian calf", 210809508)); - + input.add( new Pair<String, Integer>("mens giorgio brutini shoes italian calf", 210809508)); + input.add( new Pair<String, Integer>("halo portable backup battery", 1640825398)); -input.add( new Pair<String, Integer>("kenwood pkgmp18 cd receiver coaxial speakers",1642712915)); -input.add( new Pair<String, Integer>("element ultraslim hdtv",1643167865)); -input.add( new Pair<String, Integer>("westinghouse dled hdtv black",1641930013)); -input.add( new Pair<String, Integer>("boss audio receiver speaker package system",1643532459)); -input.add( new Pair<String, Integer>("kenwood cd receiver coaxial speakers bundle",1646566070)); -input.add( new Pair<String, Integer>("element electronics lcd tv black ",1637163018)); -input.add( new Pair<String, Integer>("stunt copter rechargeable battery pack",1636937811)); -input.add( new Pair<String, Integer>("element led ultraslim hdtv soundbar",1637572596)); -input.add( new Pair<String, Integer>("boss receiver speaker package system bundle",1646566067)); -input.add( new Pair<String, Integer>("coby hd tv",1638746307)); -input.add( new Pair<String, Integer>("vizio diag led smart hdtv",1660162001)); -input.add( new Pair<String, Integer>("sony dock for ipad ipod and iphone",1646826284)); -input.add( new Pair<String, Integer>("vizio led ultraslim hdtv",1642018249)); -input.add( new Pair<String, Integer>("lcd kula tv multimedia player",1640265845)); - -input.add(new Pair<String, Integer>("liz and co alex tall leather boots",1630836375)); -input.add( new Pair<String, Integer>("total girl silvia sequin moccasin", 1630828314)); -input.add( new Pair<String, Integer>("new england patriots new era nfl sport sideline knit", 1588531904)); -input.add( new Pair<String, Integer>("betseyville sequin backpack", 1630825375)); -input.add( new Pair<String, Integer>("the north face womens osito jacket mojito", 1639791775)); -input.add( new Pair<String, Integer>("misty harbor raincoat trench removable liner", 903542613)); -input.add(new Pair<String, Integer>("ae womens camo jacket ", 1229070780)); -input.add(new Pair<String, Integer>("indianapolis colts sideline knit", 1588531896)); -input.add(new Pair<String, Integer>("b o c korah boot", 1622401738)); -input.add(new Pair<String, Integer>("adidas mens speed cut track suit", 920744865)); -input.add(new Pair<String, Integer>("liz and co lulu zipper boots", 1630836380)); -input.add(new Pair<String, Integer>("black navy lightweight oxford shoes", 906123996)); -input.add(new Pair<String, Integer>("liz and co farley tall boots", 1639960280)); -input.add(new Pair<String, Integer>("call it spring karpin pullon boots", 1629938981)); -input.add(new Pair<String, Integer>("ugg australia bailey bow boots", 1594029054)); -input.add(new Pair<String, Integer>("dream chasers jacket", 1631247949)); -input.add(new Pair<String, Integer>("guess military tiewaist coat", 1629993909)); -input.add(new Pair<String, Integer>("madden girl allstaar womens zip boots", 1581506993)); -input.add(new Pair<String, Integer>("michael womens shoes", 1590598743)); -input.add(new Pair<String, Integer>("sonoma life style suede midcalf boots women", 1617302927)); - + input.add( new Pair<String, Integer>("kenwood pkgmp18 cd receiver coaxial speakers",1642712915)); + input.add( new Pair<String, Integer>("element ultraslim hdtv",1643167865)); + input.add( new Pair<String, Integer>("westinghouse dled hdtv black",1641930013)); + input.add( new Pair<String, Integer>("boss audio receiver speaker package system",1643532459)); + input.add( new Pair<String, Integer>("kenwood cd receiver coaxial speakers bundle",1646566070)); + input.add( new Pair<String, Integer>("element electronics lcd tv black ",1637163018)); + input.add( new Pair<String, Integer>("stunt copter rechargeable battery pack",1636937811)); + input.add( new Pair<String, Integer>("element led ultraslim hdtv soundbar",1637572596)); + input.add( new Pair<String, Integer>("boss receiver speaker package system bundle",1646566067)); + input.add( new Pair<String, Integer>("coby hd tv",1638746307)); + input.add( new Pair<String, Integer>("vizio diag led smart hdtv",1660162001)); + input.add( new Pair<String, Integer>("sony dock for ipad ipod and iphone",1646826284)); + input.add( new Pair<String, Integer>("vizio led ultraslim hdtv",1642018249)); + input.add( new Pair<String, Integer>("lcd kula tv multimedia player",1640265845)); + + input.add(new Pair<String, Integer>("liz and co alex tall leather boots",1630836375)); + input.add( new Pair<String, Integer>("total girl silvia sequin moccasin", 1630828314)); + input.add( new Pair<String, Integer>("new england patriots new era nfl sport sideline knit", 1588531904)); + input.add( new Pair<String, Integer>("betseyville sequin backpack", 1630825375)); + input.add( new Pair<String, Integer>("the north face womens osito jacket mojito", 1639791775)); + input.add( new Pair<String, Integer>("misty harbor raincoat trench removable liner", 903542613)); + input.add(new Pair<String, Integer>("ae womens camo jacket ", 1229070780)); + input.add(new Pair<String, Integer>("indianapolis colts sideline knit", 1588531896)); + input.add(new Pair<String, Integer>("b o c korah boot", 1622401738)); + input.add(new Pair<String, Integer>("adidas mens speed cut track suit", 920744865)); + input.add(new Pair<String, Integer>("liz and co lulu zipper boots", 1630836380)); + input.add(new Pair<String, Integer>("black navy lightweight oxford shoes", 906123996)); + input.add(new Pair<String, Integer>("liz and co farley tall boots", 1639960280)); + input.add(new Pair<String, Integer>("call it spring karpin pullon boots", 1629938981)); + input.add(new Pair<String, Integer>("ugg australia bailey bow boots", 1594029054)); + input.add(new Pair<String, Integer>("dream chasers jacket", 1631247949)); + input.add(new Pair<String, Integer>("guess military tiewaist coat", 1629993909)); + input.add(new Pair<String, Integer>("madden girl allstaar womens zip boots", 1581506993)); + input.add(new Pair<String, Integer>("michael womens shoes", 1590598743)); + input.add(new Pair<String, Integer>("sonoma life style suede midcalf boots women", 1617302927)); + input.add(new Pair<String, Integer>("absolute pnf300 power noise filterground loop isolator with adjustable controls", 1521965454)); input.add(new Pair<String, Integer>("sennheiser ie8 stereo earbuds", 211969101)); input.add(new Pair<String, Integer>("sanus vlmf109 motorized full motion mount for tvs 37 60 up to 110 lbs", 214893385)); @@ -77,75 +94,73 @@ input.add(new Pair<String, Integer>("sonoma life style suede midcalf boots women input.add(new Pair<String, Integer>("toms bimini stitchout slipon women", 1633012540)); input.add(new Pair<String, Integer>("the north face womens p r tka 100 microvelour glacier 14 zip tnf blackjk3 medium", 1618022193)); input.add(new Pair<String, Integer>("robert graham manuel dress shirt mens long sleeve button up blue", 1631119485)); - + input.add(new Pair<String, Integer>("b o c leesa", 1584193288)); - input.add(new Pair<String, Integer>("blair stirrup pants", 1525621516)); - input.add(new Pair<String, Integer>("donna karan shirtdress", 1463793963)); - input.add(new Pair<String, Integer>("columbia sportswear terminal tackle shirt", 1661238030)); - input.add(new Pair<String, Integer>("carters jersey pajamas", 1573999243)); - input.add(new Pair<String, Integer>("vince camuto dena", 1626272001)); - input.add(new Pair<String, Integer>("pistil hudson knit hats", 1660874149)); - input.add(new Pair<String, Integer>("naturalizer trinity wide shaft womens zip", 1569191459)); - input.add(new Pair<String, Integer>("bare traps chelby womens sandals", 1513387756)); - input.add(new Pair<String, Integer>("overland storage hard drive 1 tb hotswap", 212107374)); - input.add(new Pair<String, Integer>("humminbird indash depth finder", 1616650484)); - input.add(new Pair<String, Integer>("grepsr800 gre dig scanner", 215723895)); - input.add(new Pair<String, Integer>("humminbird kayak transducer", 215392426)); - input.add(new Pair<String, Integer>("garmin nuvi suction cup mount ", 215728710)); - input.add(new Pair<String, Integer>("crosley radio black", 215662289)); - - input.add(new Triple<String, Integer, String >("avaya ip telephone", 1440488008, "lucent phone system")); - input.add(new Triple<String, Integer, String>("clarks trolley womens shoes", 1581854074, "clark womens shoes")); - input.add(new Triple<String, Integer, String>("mens evans shoes imperial deer", 210808400, "lb evans slippers")); - input.add(new Triple<String, Integer, String>("ugg classic bow shorty gloves", 1665094898, "leather gloves women")); - input.add(new Triple<String, Integer, String>("jumping beans man tee baby", 1667155332, "jumping beans clothing")); - input.add(new Triple<String, Integer, String>("asics mens shoes", 1630208773, "asics mens running shoes")); - input.add(new Triple<String, Integer, String>("oakley hoodie mens fleece", 1656661466, "hoodies for men")); - input.add(new Triple<String, Integer, String>("usb sound control digital voice recorder", 1654662662, "digital voice recorder with usb")); - input.add(new Triple<String, Integer, String>("motorola bluetooth headset", 215376254, "motorola oasis bluetooth headset")); - input.add(new Triple<String, Integer, String>("sony sound bar home theater system", 215450833, "sony sound bar")); - input.add(new Triple<String, Integer, String>("jvc full hd everio camcorder", 1664479999, "jvc everio camcorder")); - */ + input.add(new Pair<String, Integer>("blair stirrup pants", 1525621516)); + input.add(new Pair<String, Integer>("donna karan shirtdress", 1463793963)); + input.add(new Pair<String, Integer>("columbia sportswear terminal tackle shirt", 1661238030)); + input.add(new Pair<String, Integer>("carters jersey pajamas", 1573999243)); + input.add(new Pair<String, Integer>("vince camuto dena", 1626272001)); + input.add(new Pair<String, Integer>("pistil hudson knit hats", 1660874149)); + input.add(new Pair<String, Integer>("naturalizer trinity wide shaft womens zip", 1569191459)); + input.add(new Pair<String, Integer>("bare traps chelby womens sandals", 1513387756)); + input.add(new Pair<String, Integer>("overland storage hard drive 1 tb hotswap", 212107374)); + input.add(new Pair<String, Integer>("humminbird indash depth finder", 1616650484)); + input.add(new Pair<String, Integer>("grepsr800 gre dig scanner", 215723895)); + input.add(new Pair<String, Integer>("humminbird kayak transducer", 215392426)); + input.add(new Pair<String, Integer>("garmin nuvi suction cup mount ", 215728710)); + input.add(new Pair<String, Integer>("crosley radio black", 215662289)); + + input.add(new Triple<String, Integer, String >("avaya ip telephone", 1440488008, "lucent phone system")); + input.add(new Triple<>("clarks trolley womens shoes", 1581854074, "clark womens shoes")); + input.add(new Triple<>("mens evans shoes imperial deer", 210808400, "lb evans slippers")); + input.add(new Triple<>("ugg classic bow shorty gloves", 1665094898, "leather gloves women")); + input.add(new Triple<>("jumping beans man tee baby", 1667155332, "jumping beans clothing")); + input.add(new Triple<>("asics mens shoes", 1630208773, "asics mens running shoes")); + input.add(new Triple<>("oakley hoodie mens fleece", 1656661466, "hoodies for men")); + input.add(new Triple<>("usb sound control digital voice recorder", 1654662662, "digital voice recorder with usb")); + input.add(new Triple<>("motorola bluetooth headset", 215376254, "motorola oasis bluetooth headset")); + input.add(new Triple<>("sony sound bar home theater system", 215450833, "sony sound bar")); + input.add(new Triple<>("jvc full hd everio camcorder", 1664479999, "jvc everio camcorder")); + */ - input.add(new Triple<String, Integer, String>("dr martens beckett laceup boots", 1651452641, "doc martin shoes")); - input.add(new Triple<String, Integer, String>("pioneer cd changer",204654672, "pioneer cd player")); - input.add(new Triple<String, Integer, String>("tablet handler strap and desk mount", 1634326303, "tablet holder")); - input.add(new Triple<String, Integer, String>("sockwell loden womens overthecalf socks", 1644572708, "compression stockings, support stockings")); - input.add(new Triple<String, Integer, String>("nike eclipse womens shoes", 1657807048, "nike eclipse ii women s shoe")); - input.add(new Triple<String, Integer, String>("cherokee workwear womens scrub pant black stall",211643295, "cherokee workwear scrubs")); - input.add(new Triple<String, Integer, String>("columbia sportswear jacket ", 1667381935, "columbia omni heat")); - input.add(new Triple<String, Integer, String>("adidas adipure jacket", 1040124787, "adidas track jacket")); - input.add(new Triple<String, Integer, String>("clarks may orchid womens shoes", 1585805688, "clarks loafers")); - input.add(new Triple<String, Integer, String>("levis pants empire blue", 1670283141, "skinny jeans for guys")); - input.add(new Triple<String, Integer, String>("nike jordan black cat tee", 1653598764, "jordan black cat")); - input.add(new Triple<String, Integer, String>("obermeyer womens kassandra down coat", 1670629180, "down winter coats")); + input.add(new Triple<>("dr martens beckett laceup boots", 1651452641, "doc martin shoes")); + input.add(new Triple<>("pioneer cd changer",204654672, "pioneer cd player")); + input.add(new Triple<>("tablet handler strap and desk mount", 1634326303, "tablet holder")); + input.add(new Triple<>("sockwell loden womens overthecalf socks", 1644572708, "compression stockings, support stockings")); + input.add(new Triple<>("nike eclipse womens shoes", 1657807048, "nike eclipse ii women s shoe")); + input.add(new Triple<>("cherokee workwear womens scrub pant black stall",211643295, "cherokee workwear scrubs")); + input.add(new Triple<>("columbia sportswear jacket ", 1667381935, "columbia omni heat")); + input.add(new Triple<>("adidas adipure jacket", 1040124787, "adidas track jacket")); + input.add(new Triple<>("clarks may orchid womens shoes", 1585805688, "clarks loafers")); + input.add(new Triple<>("levis pants empire blue", 1670283141, "skinny jeans for guys")); + input.add(new Triple<>("nike jordan black cat tee", 1653598764, "jordan black cat")); + input.add(new Triple<>("obermeyer womens kassandra down coat", 1670629180, "down winter coats")); /* - input.add(new Triple<String, Integer, String>("paramax surround sound", 835422569, "paramax im3")); - input.add(new Triple<String, Integer, String>("mia quincy wedge", 1285886230, "mia quincy wedge")); - input.add(new Triple<String, Integer, String>("able planet headphones", 1648522886, "able planet nc210g")); - input.add(new Triple<String, Integer, String>("samsung replacement lamp", 695793593, "lamp code bp96")); - input.add(new Triple<String, Integer, String>("paul green emerson boot castagno", 1313967918, "paul green emerson boot")); - input.add(new Triple<String, Integer, String>("bandolino caresse boots", 1448643623, "bandolino caresse boots")); - input.add(new Triple<String, Integer, String>("nine west modiley", 1365998968, "nine west modiley")); - input.add(new Triple<String, Integer, String>("converse chuck taylor bisay", 1555900934, "turquoise chuck taylors")); - input.add(new Triple<String, Integer, String>("gentle souls bay leaf flats", 1436175162, "gentle souls bay leaf")); - input.add(new Triple<String, Integer, String>("sauce hockey back hat", 1644440355, "sauce hockey discount code")); - input.add(new Triple<String, Integer, String>("aravon farren oxford shoes", 1644573438, "aravon wef07sh")); - */ input.add(new Triple<String, Integer, String>("kooba crosby hobo handbags", 1326503038, "kooba crosby")); - input.add(new Triple<String, Integer, String>("bcbgmaxazria sheath dress", 1313949777, "bcbgmaxazria illusion bodice ruched sheath dress")); - input.add(new Triple<String, Integer, String>("billabong boardshorts trunks", 1316823074, "la siesta boardshorts")); - input.add(new Triple<String, Integer, String>("mootsies tootsies boot", 1503727310, "mootsies tootsies draker")); - input.add(new Triple<String, Integer, String>("nine west bootie", 1503730060, "nine west drina")); - input.add(new Triple<String, Integer, String>("playtex support cotton ", 1331026244, "playtex t723")); - input.add(new Triple<String, Integer, String>("fossil morgan satchel taupe", 1355165745, "fossil morgan satchel")); - input.add(new Triple<String, Integer, String>("katonah womens boots brown", 1420057844, "boc katonah boots")); - input.add(new Triple<String, Integer, String>("boot cut jeans supernova", 1363356262, "levis 527 supernova")); - input.add(new Triple<String, Integer, String>("steve madden buckie boot", 1313965918, "steve madden buckie boot")); - input.add(new Triple<String, Integer, String>("charlies horse tshirt", 1428490587, "charlie s horse shirt")); - input.add(new Triple<String, Integer, String>("igloo little playmate ice chest", 205421625, "igloo little playmate")); - input.add(new Triple<String, Integer, String>("mark nason boot", 1313951044, "mark nason rudd")); - - + input.add(new Triple<>("paramax surround sound", 835422569, "paramax im3")); + input.add(new Triple<>("mia quincy wedge", 1285886230, "mia quincy wedge")); + input.add(new Triple<>("able planet headphones", 1648522886, "able planet nc210g")); + input.add(new Triple<>("samsung replacement lamp", 695793593, "lamp code bp96")); + input.add(new Triple<>("paul green emerson boot castagno", 1313967918, "paul green emerson boot")); + input.add(new Triple<>("bandolino caresse boots", 1448643623, "bandolino caresse boots")); + input.add(new Triple<>("nine west modiley", 1365998968, "nine west modiley")); + input.add(new Triple<>("converse chuck taylor bisay", 1555900934, "turquoise chuck taylors")); + input.add(new Triple<>("gentle souls bay leaf flats", 1436175162, "gentle souls bay leaf")); + input.add(new Triple<>("sauce hockey back hat", 1644440355, "sauce hockey discount code")); + input.add(new Triple<>("aravon farren oxford shoes", 1644573438, "aravon wef07sh")); +*/ input.add(new Triple<>("kooba crosby hobo handbags", 1326503038, "kooba crosby")); + input.add(new Triple<>("bcbgmaxazria sheath dress", 1313949777, "bcbgmaxazria illusion bodice ruched sheath dress")); + input.add(new Triple<>("billabong boardshorts trunks", 1316823074, "la siesta boardshorts")); + input.add(new Triple<>("mootsies tootsies boot", 1503727310, "mootsies tootsies draker")); + input.add(new Triple<>("nine west bootie", 1503730060, "nine west drina")); + input.add(new Triple<>("playtex support cotton ", 1331026244, "playtex t723")); + input.add(new Triple<>("fossil morgan satchel taupe", 1355165745, "fossil morgan satchel")); + input.add(new Triple<>("katonah womens boots brown", 1420057844, "boc katonah boots")); + input.add(new Triple<>("boot cut jeans supernova", 1363356262, "levis 527 supernova")); + input.add(new Triple<>("steve madden buckie boot", 1313965918, "steve madden buckie boot")); + input.add(new Triple<>("charlies horse tshirt", 1428490587, "charlie s horse shirt")); + input.add(new Triple<>("igloo little playmate ice chest", 205421625, "igloo little playmate")); + input.add(new Triple<>("mark nason boot", 1313951044, "mark nason rudd")); } diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewObj.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewObj.java index 537fdf9..0c23938 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewObj.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/ReviewObj.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.List; diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceBeingOriginalized.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceBeingOriginalized.java index 9c87e7f..739f54d 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceBeingOriginalized.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceBeingOriginalized.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.HashMap; @@ -7,7 +24,7 @@ import java.util.Map; import opennlp.tools.textsimilarity.ParseTreeChunk; public class SentenceBeingOriginalized { - private Map<String, String> sentKey_value= new HashMap<String, String>(); + private Map<String, String> sentKey_value = new HashMap<String, String>(); private String sentence; private List<List<ParseTreeChunk>> groupedChunks; diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java index 1e53d2a..4fddc14 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.ArrayList; diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/URLsWithReviewFinderByProductName.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/URLsWithReviewFinderByProductName.java index c573e46..31d3cd4 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/URLsWithReviewFinderByProductName.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/URLsWithReviewFinderByProductName.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.ArrayList; @@ -7,7 +24,7 @@ import opennlp.tools.similarity.apps.BingQueryRunner; import opennlp.tools.similarity.apps.HitBase; public class URLsWithReviewFinderByProductName { -BingQueryRunner search = new BingQueryRunner(); + BingQueryRunner search = new BingQueryRunner(); public List<String> findFacebookURLByNameAndZip(String name){ List<HitBase> foundFBPages = search.runSearch(name, 20); diff --git a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java index de3f5a6..2120830 100644 --- a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java +++ b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java @@ -1,3 +1,20 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one or more + * contributor license agreements. See the NOTICE file distributed with + * this work for additional information regarding copyright ownership. + * The ASF licenses this file to You under the Apache License, Version 2.0 + * (the "License"); you may not use this file except in compliance with + * the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + */ + package opennlp.tools.apps.review_builder; import java.util.ArrayList;
