This is an automated email from the ASF dual-hosted git repository.
mawiesne pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/opennlp-sandbox.git
The following commit(s) were added to refs/heads/main by this push:
new 494aa2e9 Addresses known security vulnerabilities in commons-lang and
jdom (#470)
494aa2e9 is described below
commit 494aa2e9b8039f3d259c54208dccf8fc86cdb1e5
Author: Richard Zowalla <[email protected]>
AuthorDate: Tue May 12 12:34:46 2026 +0200
Addresses known security vulnerabilities in commons-lang and jdom (#470)
* Addresses known security vulnerabilities in commons-lang and jdom
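- Bumps org.jdom:jdom:2.0.2 to org.jdom:jdom2:2.0.6.1 in mallet-addon
(CVE-2021-33813); superseded by the follow-up change below, which drops the
jdom dependency from mallet-addon entirely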
- Drops legacy commons-lang 2.6 and migrates opennlp-similarity sources to
commons-lang3 (CVE-2025-48924)
- Replaces removed StringEscapeUtils.unescapeHtml with commons-text
StringEscapeUtils.unescapeHtml4
- Adds commons-text 1.14.0 to dependencyManagement
* Drops obsolete jdom and bsh deps from mallet-addon
Mallet 2.1.0 no longer requires jdom or beanshell; both were
leftovers from older Mallet versions. Verified that neither artifact
is referenced in mallet-2.1.0.jar bytecode.
---
mallet-addon/pom.xml | 18 ------------------
opennlp-similarity/pom.xml | 8 ++++++++
.../tools/apps/relevanceVocabs/PhraseProcessor.java | 2 +-
.../apps/review_builder/MinedSentenceProcessor.java | 2 +-
.../apps/review_builder/SentenceOriginalizer.java | 2 +-
.../apps/review_builder/WebPageReviewExtractor.java | 2 +-
.../opennlp/tools/doc_classifier/DocClassifier.java | 2 +-
.../DocClassifierTrainingSetMultilingualExtender.java | 2 +-
.../jsmlearning/FeatureSpaceCoverageProcessor.java | 2 +-
.../apps/MostFrequentWordsFromPageGetter.java | 2 +-
.../tools/parse_thicket/apps/SnippetToParagraph.java | 2 +-
.../apps/WebPageContentSentenceExtractor.java | 2 +-
.../tools/parse_thicket/apps/WebPageExtractor.java | 2 +-
.../tools/similarity/apps/ContentGeneratorSupport.java | 2 +-
.../similarity/apps/GeneratedSentenceProcessor.java | 2 +-
.../similarity/apps/GoogleAutoCompleteQueryRunner.java | 2 +-
.../java/opennlp/tools/similarity/apps/HitBase.java | 2 +-
.../tools/similarity/apps/RelatedSentenceFinder.java | 2 +-
.../tools/similarity/apps/StoryDiscourseNavigator.java | 2 +-
.../similarity/apps/WebSearchEngineResultsScraper.java | 2 +-
.../similarity/apps/solr/IterativeQueryComponent.java | 2 +-
.../apps/solr/IterativeSearchRequestHandler.java | 4 ++--
.../apps/solr/NLProgram2CodeRequestHandler.java | 2 +-
.../apps/solr/SearchResultsReRankerRequestHandler.java | 2 +-
.../similarity/apps/solr/SyntGenRequestHandler.java | 4 ++--
.../apps/taxo_builder/DomainTaxonomyExtender.java | 2 +-
.../opennlp/tools/similarity/apps/utils/Utils.java | 4 ++--
.../tools/textsimilarity/SentencePairMatchResult.java | 2 +-
.../opennlp/tools/textsimilarity/TextProcessor.java | 2 +-
pom.xml | 12 ++++++------
30 files changed, 44 insertions(+), 54 deletions(-)
diff --git a/mallet-addon/pom.xml b/mallet-addon/pom.xml
index 6900c872..48237abb 100644
--- a/mallet-addon/pom.xml
+++ b/mallet-addon/pom.xml
@@ -48,26 +48,8 @@
<groupId>junit</groupId>
<artifactId>junit</artifactId>
</exclusion>
- <exclusion>
- <groupId>org.jdom</groupId>
- <artifactId>jdom</artifactId>
- </exclusion>
- <exclusion>
- <groupId>org.beanshell</groupId>
- <artifactId>bsh</artifactId>
- </exclusion>
</exclusions>
</dependency>
- <dependency>
- <groupId>org.jdom</groupId>
- <artifactId>jdom</artifactId>
- <version>2.0.2</version>
- </dependency>
- <dependency>
- <groupId>org.apache-extras.beanshell</groupId>
- <artifactId>bsh</artifactId>
- <version>2.0b6</version>
- </dependency>
</dependencies>
<build>
diff --git a/opennlp-similarity/pom.xml b/opennlp-similarity/pom.xml
index 2bce9a01..65b503dc 100644
--- a/opennlp-similarity/pom.xml
+++ b/opennlp-similarity/pom.xml
@@ -110,6 +110,14 @@
<groupId>org.apache.commons</groupId>
<artifactId>commons-collections4</artifactId>
</dependency>
+ <dependency>
+ <groupId>org.apache.commons</groupId>
+ <artifactId>commons-lang3</artifactId>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.commons</groupId>
+ <artifactId>commons-text</artifactId>
+ </dependency>
<dependency>
<groupId>jakarta.xml.bind</groupId>
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/apps/relevanceVocabs/PhraseProcessor.java
b/opennlp-similarity/src/main/java/opennlp/tools/apps/relevanceVocabs/PhraseProcessor.java
index 013ad90a..ccdc1035 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/apps/relevanceVocabs/PhraseProcessor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/apps/relevanceVocabs/PhraseProcessor.java
@@ -20,7 +20,7 @@ package opennlp.tools.apps.relevanceVocabs;
import java.util.ArrayList;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.parser.Parse;
import opennlp.tools.textsimilarity.ParseTreeChunk;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java
index e5590e71..ee9c7775 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/MinedSentenceProcessor.java
@@ -17,7 +17,7 @@
package opennlp.tools.apps.review_builder;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.Utils;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java
index 7b900dfc..030ae928 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/SentenceOriginalizer.java
@@ -23,7 +23,7 @@ import java.util.HashSet;
import java.util.List;
import java.util.Random;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.apps.relevanceVocabs.PhraseProcessor;
import opennlp.tools.apps.relevanceVocabs.SentimentVocab;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java
index 4285f0d4..3644294f 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/apps/review_builder/WebPageReviewExtractor.java
@@ -28,7 +28,7 @@ import
opennlp.tools.similarity.apps.utils.StringDistanceMeasurer;
import opennlp.tools.similarity.apps.utils.Utils;
import opennlp.tools.textsimilarity.TextProcessor;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifier.java
b/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifier.java
index 5f502774..3aee84c3 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifier.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifier.java
@@ -24,7 +24,7 @@ import java.util.List;
import java.util.Map;
import java.util.Scanner;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.lucene.analysis.Analyzer;
import org.apache.lucene.analysis.standard.StandardAnalyzer;
import org.apache.lucene.document.Document;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifierTrainingSetMultilingualExtender.java
b/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifierTrainingSetMultilingualExtender.java
index 18d778cf..d4d80952 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifierTrainingSetMultilingualExtender.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/doc_classifier/DocClassifierTrainingSetMultilingualExtender.java
@@ -32,7 +32,7 @@ import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
/*
* This utility gets 'training_corpus' as input and creates a new version of
training_corpus with verified files.
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/jsmlearning/FeatureSpaceCoverageProcessor.java
b/opennlp-similarity/src/main/java/opennlp/tools/jsmlearning/FeatureSpaceCoverageProcessor.java
index c8094664..5eddadef 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/jsmlearning/FeatureSpaceCoverageProcessor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/jsmlearning/FeatureSpaceCoverageProcessor.java
@@ -22,7 +22,7 @@ import java.util.HashMap;
import java.util.List;
import java.util.Map;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class FeatureSpaceCoverageProcessor {
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/MostFrequentWordsFromPageGetter.java
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/MostFrequentWordsFromPageGetter.java
index 54c0b8b9..85a46600 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/MostFrequentWordsFromPageGetter.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/MostFrequentWordsFromPageGetter.java
@@ -22,7 +22,7 @@ import java.util.List;
import java.util.Map;
import java.util.Scanner;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.ValueSortMap;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/SnippetToParagraph.java
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/SnippetToParagraph.java
index c22ba9fe..82d2ef93 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/SnippetToParagraph.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/SnippetToParagraph.java
@@ -22,7 +22,7 @@ import java.util.Arrays;
import java.util.Comparator;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.ContentGeneratorSupport;
import opennlp.tools.similarity.apps.Fragment;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageContentSentenceExtractor.java
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageContentSentenceExtractor.java
index df0c6c0b..31d139f7 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageContentSentenceExtractor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageContentSentenceExtractor.java
@@ -23,7 +23,7 @@ import java.util.List;
import opennlp.tools.similarity.apps.GeneratedSentenceProcessor;
import opennlp.tools.similarity.apps.HitBase;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class WebPageContentSentenceExtractor extends WebPageExtractor {
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageExtractor.java
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageExtractor.java
index 94960e5c..3291f65c 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageExtractor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/parse_thicket/apps/WebPageExtractor.java
@@ -22,7 +22,7 @@ import java.util.Arrays;
import java.util.Comparator;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.GeneratedSentenceProcessor;
import opennlp.tools.similarity.apps.utils.PageFetcher;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/ContentGeneratorSupport.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/ContentGeneratorSupport.java
index abdb60c3..a71b8651 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/ContentGeneratorSupport.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/ContentGeneratorSupport.java
@@ -29,7 +29,7 @@ import opennlp.tools.textsimilarity.ParseTreeChunk;
import opennlp.tools.textsimilarity.TextProcessor;
import
opennlp.tools.textsimilarity.chunker2matcher.ParserChunker2MatcherProcessor;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GeneratedSentenceProcessor.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GeneratedSentenceProcessor.java
index d94c1c2c..d33d33e9 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GeneratedSentenceProcessor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GeneratedSentenceProcessor.java
@@ -21,7 +21,7 @@ import java.lang.invoke.MethodHandles;
import java.util.Arrays;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.Utils;
import org.slf4j.Logger;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GoogleAutoCompleteQueryRunner.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GoogleAutoCompleteQueryRunner.java
index 2549c297..ec6b0a41 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GoogleAutoCompleteQueryRunner.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/GoogleAutoCompleteQueryRunner.java
@@ -22,7 +22,7 @@ import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.PageFetcher;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/HitBase.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/HitBase.java
index 5b1dfdd1..2e5688e1 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/HitBase.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/HitBase.java
@@ -23,7 +23,7 @@ import java.util.logging.Logger;
import opennlp.tools.similarity.apps.utils.StringDistanceMeasurer;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class HitBase {
private static final Logger LOG = Logger
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/RelatedSentenceFinder.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/RelatedSentenceFinder.java
index 19561d38..4e0799db 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/RelatedSentenceFinder.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/RelatedSentenceFinder.java
@@ -25,7 +25,7 @@ import java.util.HashSet;
import java.util.List;
import java.util.Set;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.parse_thicket.Triple;
import opennlp.tools.similarity.apps.utils.PageFetcher;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/StoryDiscourseNavigator.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/StoryDiscourseNavigator.java
index f9cf47e4..3fce1ecd 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/StoryDiscourseNavigator.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/StoryDiscourseNavigator.java
@@ -23,7 +23,7 @@ import java.util.Collection;
import java.util.HashSet;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.PageFetcher;
import opennlp.tools.similarity.apps.utils.StringCleaner;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/WebSearchEngineResultsScraper.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/WebSearchEngineResultsScraper.java
index 9ff771d4..9305e294 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/WebSearchEngineResultsScraper.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/WebSearchEngineResultsScraper.java
@@ -30,7 +30,7 @@ import java.util.List;
import java.util.Map;
import java.util.Set;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class WebSearchEngineResultsScraper {
public WebSearchEngineResultsScraper(){
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeQueryComponent.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeQueryComponent.java
index c427366d..8b25b0e6 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeQueryComponent.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeQueryComponent.java
@@ -20,7 +20,7 @@ import java.io.IOException;
import java.util.ArrayList;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.Query;
import org.apache.solr.common.params.CommonParams;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeSearchRequestHandler.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeSearchRequestHandler.java
index 1cba60a9..888fb8bc 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeSearchRequestHandler.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/IterativeSearchRequestHandler.java
@@ -25,8 +25,8 @@ import java.util.List;
import java.util.Map;
import java.util.Set;
-import org.apache.commons.lang.ArrayUtils;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.ArrayUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.lucene.document.Document;
import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.IndexReader;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/NLProgram2CodeRequestHandler.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/NLProgram2CodeRequestHandler.java
index 42e2ecf8..eb117435 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/NLProgram2CodeRequestHandler.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/NLProgram2CodeRequestHandler.java
@@ -23,7 +23,7 @@ import opennlp.tools.nl2code.NL2ObjCreateAssign;
import opennlp.tools.nl2code.ObjectPhraseListForSentence;
import opennlp.tools.textsimilarity.ParseTreeChunkListScorer;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.solr.common.util.NamedList;
import org.apache.solr.handler.component.SearchHandler;
import org.apache.solr.request.SolrQueryRequest;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SearchResultsReRankerRequestHandler.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SearchResultsReRankerRequestHandler.java
index c7345fc5..9dd96af7 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SearchResultsReRankerRequestHandler.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SearchResultsReRankerRequestHandler.java
@@ -28,7 +28,7 @@ import opennlp.tools.textsimilarity.ParseTreeChunkListScorer;
import opennlp.tools.textsimilarity.SentencePairMatchResult;
import
opennlp.tools.textsimilarity.chunker2matcher.ParserChunker2MatcherProcessor;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.solr.common.params.SolrParams;
import org.apache.solr.common.util.NamedList;
import org.apache.solr.handler.component.SearchHandler;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SyntGenRequestHandler.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SyntGenRequestHandler.java
index bf78e15b..b6b8be79 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SyntGenRequestHandler.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/solr/SyntGenRequestHandler.java
@@ -31,8 +31,8 @@ import opennlp.tools.textsimilarity.ParseTreeChunkListScorer;
import opennlp.tools.textsimilarity.SentencePairMatchResult;
import
opennlp.tools.textsimilarity.chunker2matcher.ParserChunker2MatcherProcessor;
-import org.apache.commons.lang.ArrayUtils;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.ArrayUtils;
+import org.apache.commons.lang3.StringUtils;
import org.apache.lucene.document.Document;
import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.IndexReader;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/taxo_builder/DomainTaxonomyExtender.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/taxo_builder/DomainTaxonomyExtender.java
index c346d35a..afe8ff1b 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/taxo_builder/DomainTaxonomyExtender.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/taxo_builder/DomainTaxonomyExtender.java
@@ -26,7 +26,7 @@ import java.util.HashSet;
import java.util.List;
import java.util.Map;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import org.slf4j.LoggerFactory;
import opennlp.tools.similarity.apps.HitBase;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/utils/Utils.java
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/utils/Utils.java
index 4fd8a177..c63faaae 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/utils/Utils.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/similarity/apps/utils/Utils.java
@@ -26,7 +26,7 @@ import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class Utils {
@@ -437,7 +437,7 @@ public class Utils {
}
public static String unescapeHTML(String text) {
- return org.apache.commons.lang.StringEscapeUtils.unescapeHtml(text);
+ return org.apache.commons.text.StringEscapeUtils.unescapeHtml4(text);
}
public static String stripHTML(String text) {
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/SentencePairMatchResult.java
b/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/SentencePairMatchResult.java
index de13ae33..1650aa84 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/SentencePairMatchResult.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/SentencePairMatchResult.java
@@ -19,7 +19,7 @@ package opennlp.tools.textsimilarity;
import java.util.List;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
public class SentencePairMatchResult {
private List<List<ParseTreeChunk>> matchResult;
diff --git
a/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/TextProcessor.java
b/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/TextProcessor.java
index cae45654..d3005ca0 100644
---
a/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/TextProcessor.java
+++
b/opennlp-similarity/src/main/java/opennlp/tools/textsimilarity/TextProcessor.java
@@ -32,7 +32,7 @@ import java.util.logging.Logger;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
-import org.apache.commons.lang.StringUtils;
+import org.apache.commons.lang3.StringUtils;
import opennlp.tools.similarity.apps.utils.Pair;
import opennlp.tools.stemmer.PorterStemmer;
diff --git a/pom.xml b/pom.xml
index ac231c48..f822e1bd 100644
--- a/pom.xml
+++ b/pom.xml
@@ -130,8 +130,8 @@
<commons-collections4.version>4.5.0</commons-collections4.version>
<commons-compress.version>1.28.0</commons-compress.version>
<commons-io.version>2.22.0</commons-io.version>
- <commons-lang.version>2.6</commons-lang.version>
<commons-lang3.version>3.20.0</commons-lang3.version>
+ <commons-text.version>1.14.0</commons-text.version>
<commons-logging.version>1.3.6</commons-logging.version>
<commons-math3.version>3.6.1</commons-math3.version>
@@ -202,11 +202,6 @@
<artifactId>commons-cli</artifactId>
<version>${commons-cli.version}</version>
</dependency>
- <dependency>
- <groupId>commons-lang</groupId>
- <artifactId>commons-lang</artifactId>
- <version>${commons-lang.version}</version>
- </dependency>
<dependency>
<groupId>commons-io</groupId>
<artifactId>commons-io</artifactId>
@@ -217,6 +212,11 @@
<artifactId>commons-lang3</artifactId>
<version>${commons-lang3.version}</version>
</dependency>
+ <dependency>
+ <groupId>org.apache.commons</groupId>
+ <artifactId>commons-text</artifactId>
+ <version>${commons-text.version}</version>
+ </dependency>
<dependency>
<groupId>commons-codec</groupId>
<artifactId>commons-codec</artifactId>