This is an automated email from the ASF dual-hosted git repository.
mawiesne pushed a change to branch
updates_sandbox_component_'summarizer'_to_be_compatible_with_latest_opennlp-tools_release
in repository https://gitbox.apache.org/repos/asf/opennlp-sandbox.git
discard bcc3c5d updates sandbox component 'summarizer' to be compatible with
latest opennlp-tools release
add 03aa30c migrate sandbox component 'nlp-utils' to Java 11 (#75)
add 6b8bc07
introduce-common-maven-module-structure-for-corpus-server-components (#74)
add 57438de migrate sandbox component 'caseditor-corpus-server-plugin' to
Java 11 (#77)
add b4ac48e Introduce common parent pom for all 'opennlp-sandbox'
components (#79)
add fa15c58 Updates maven.yaml to fix deprecation warnings
add 40ff5f2 updates sandbox component 'opennlp-dl' to be compatible with
latest opennlp-tools release
add ff0e667 updates sandbox component 'summarizer' to be compatible with
latest opennlp-tools release
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user --force pushes a change and generates a repository
containing something like this:
 * -- * -- B -- O -- O -- O   (bcc3c5d)
            \
             N -- N -- N   refs/heads/updates_sandbox_component_'summarizer'_to_be_compatible_with_latest_opennlp-tools_release (ff0e667)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
.gitattributes | 48 +
.github/CONTRIBUTING.md | 11 +
.github/PULL_REQUEST_TEMPLATE.md | 27 +
.github/workflows/maven.yml | 51 +
.gitignore | 8 +-
caseditor-corpus-server-plugin/pom.xml | 62 +-
.../caseditor/CorpusExplorerView.java | 17 +-
.../caseditor/CorpusServerCasEditorInput.java | 6 +-
.../caseditor/CorpusServerPlugin.java | 2 +
.../caseditor/DefaultCasDocumentProvider.java | 119 +-
.../corpus_server/caseditor/TaskQueueView.java | 12 +-
caseditor-opennlp-plugin/pom.xml | 20 +-
.../caseditor/util/ContainingConstraint.java | 144 +-
checkstyle.xml | 142 +
.../corpus_server/connector/CSCasConsumerTest.java | 59 -
.../connector/CSCollectionReaderTest.java | 77 -
corpus-server-impl/pom.xml | 155 -
.../corpus-server-connector}/desc/CSCasWriter.xml | 120 +-
.../desc/CSQueueCollectionReader.xml | 216 +-
.../desc/EngPersonNameFinderTrainerCPE.xml | 0
.../desc/EngTokenizerAndSentdetectCPE.xml | 0
.../desc/PersonNameFinderTrainer.xml | 0
.../desc/SentenceDetector.xml | 0
.../corpus-server-connector}/desc/Tokenizer.xml | 0
.../desc/TokenizerAndSentdetectAAE.xml | 0
.../corpus-server-connector}/pom.xml | 67 +-
.../corpus_server/connector/CSCasWriter.java | 5 +-
.../connector/CSQueueCollectionReader.java | 2 +-
.../opennlp/corpus_server/connector/UimaUtil.java | 3 +-
.../corpus_server/connector/AbstractCSTest.java | 38 +-
.../corpus_server/connector/CSCasWriterTest.java | 84 +
.../connector/CSCollectionReaderTest.java | 112 +
.../corpus_server/connector}/TestCorpusServer.java | 4 +-
.../test/resources/CSCasConsumerTestDescriptor.xml | 2 +-
.../resources/CSCollectionReaderTestDescriptor.xml | 2 +-
.../src/test/resources}/TypeSystem.xml | 0
corpus-server/{ => corpus-server-core}/feature.xml | 4 +-
corpus-server/corpus-server-core/pom.xml | 120 +
.../opennlp/corpus_server/CorporaResource.java | 10 +-
.../opennlp/corpus_server/CorpusResource.java | 0
.../apache/opennlp/corpus_server/CorpusServer.java | 6 +-
.../corpus_server/CorpusServerApplication.java | 0
.../opennlp/corpus_server/CorpusServerBundle.java | 0
.../opennlp/corpus_server/TaskQueueResource.java | 0
.../opennlp/corpus_server/TaskQueuesResource.java | 0
.../corpus_server/search/SearchService.java | 0
.../corpus_server/store/AbstractCorporaStore.java | 2 +-
.../corpus_server/store/CorporaChangeListener.java | 0
.../opennlp/corpus_server/store/CorporaStore.java | 8 +-
.../opennlp/corpus_server/store/CorpusStore.java | 0
.../corpus_server/store/MemoryCorporaStore.java | 10 +-
.../corpus_server/store/MemoryCorpusStore.java | 0
.../corpus_server/taskqueue/MemoryTaskQueue.java | 0
.../taskqueue/MemoryTaskQueueService.java | 0
.../opennlp/corpus_server/taskqueue/TaskQueue.java | 0
.../corpus_server/taskqueue/TaskQueueService.java | 0
.../corpus_server/search}/IndexWriter.properties | 0
.../opennlp/corpus_server/search/LuceneIndexer.xml | 0
.../opennlp/corpus_server/search/TypeSystem.xml | 0
.../src/main/webapp/WEB-INF/web.xml | 0
.../corpus_server/util/TestCorpusServer.java | 0
.../corpus-server-impl}/feature.xml | 4 +-
.../corpus-server-impl}/pom.xml | 96 +-
.../opennlp/corpus_server/impl/Activator.java | 2 +-
.../corpus_server/impl/CorpusServerImpl.java | 7 +-
.../corpus_server/impl/DerbyCorporaStore.java | 106 +-
.../corpus_server/impl/DerbyCorpusStore.java | 13 +-
.../opennlp/corpus_server/impl/LuceneIndexer.java | 0
.../corpus_server/impl/LuceneSearchService.java | 6 +-
.../opennlp/corpus_server/impl/UimaUtil.java | 0
.../corpus_server/impl}/IndexWriter.properties | 0
.../opennlp/corpus_server/impl/LuceneIndexer.xml | 0
.../opennlp/corpus_server/impl/TypeSystem.xml | 0
.../corpus-server-tools}/bin/cs-tools | 0
.../corpus-server-tools}/pom.xml | 44 +-
.../opennlp/corpus_server/tools/CASImporter.java | 0
.../opennlp/corpus_server/tools/CorpusBackup.java | 0
.../opennlp/corpus_server/tools/CreateCorpus.java | 0
.../corpus_server/tools/CreateTaskQueue.java | 0
.../opennlp/corpus_server/tools/DropCorpus.java | 0
.../opennlp/corpus_server/tools/FileUtil.java | 0
.../opennlp/corpus_server/tools/RemoveCAS.java | 0
.../corpus_server/tools/ReplaceTypeSystem.java | 0
.../opennlp/corpus_server/tools/SearchCorpus.java | 0
corpus-server/pom.xml | 258 +-
mahout-addon/pom.xml | 17 +-
mallet-addon/pom.xml | 16 +-
modelbuilder-addon/pom.xml | 133 +-
.../modelbuilder/DefaultModelBuilderUtil.java | 230 +-
.../addons/modelbuilder/KnownEntityProvider.java | 84 +-
.../modelbuilder/ModelGenerationValidator.java | 60 +-
.../addons/modelbuilder/ModelParameter.java | 48 +-
.../opennlp/addons/modelbuilder/Modelable.java | 84 +-
.../modelbuilder/SemiSupervisedModelGenerator.java | 48 +-
.../addons/modelbuilder/SentenceProvider.java | 48 +-
.../modelbuilder/impls/BaseModelBuilderParams.java | 176 +-
.../impls/FileKnownEntityProvider.java | 150 +-
.../modelbuilder/impls/FileModelValidatorImpl.java | 188 +-
.../modelbuilder/impls/FileSentenceProvider.java | 140 +-
.../modelbuilder/impls/GenericModelGenerator.java | 208 +-
.../modelbuilder/impls/GenericModelableImpl.java | 256 +-
nlp-utils/pom.xml | 26 +-
.../anomalydetection/AnomalyDetectionUtils.java | 7 +-
.../org/apache/opennlp/utils/cfg/CFGBuilder.java | 2 +-
.../org/apache/opennlp/utils/cfg/CFGRunner.java | 265 +-
.../opennlp/utils/cfg/ContextFreeGrammar.java | 8 +-
.../utils/cfg/ProbabilisticContextFreeGrammar.java | 22 +-
.../classification/SimpleNaiveBayesClassifier.java | 27 +-
.../UpdatableSimpleNaiveBayesClassifier.java | 24 +-
.../opennlp/utils/languagemodel/LanguageModel.java | 12 +-
.../languagemodel/NaiveSentenceLanguageModel.java | 4 +-
.../opennlp/utils/languagemodel/NoisyChannel.java | 4 +-
.../TrigramSentenceLanguageModel.java | 2 +-
.../org/apache/opennlp/utils/ngram/NGramUtils.java | 6 +-
.../utils/regression/GradientDescentUtils.java | 2 +-
.../opennlp/utils/regression/Hypothesis.java | 2 +-
.../regression/LinearCombinationHypothesis.java | 2 +-
.../utils/regression/RegressionModelUtils.java | 32 +-
.../java/org/apache/opennlp/utils/TestUtils.java | 8 +-
.../AnomalyDetectionUtilsTest.java | 5 +-
.../SimpleNaiveBayesClassifierTest.java | 6 +-
.../NaiveSentenceLanguageModelTest.java | 16 +-
.../TrigramSentenceLanguageModelTest.java | 19 +-
.../apache/opennlp/utils/ngram/NGramUtilsTest.java | 12 +-
.../utils/regression/GradientDescentUtilsTest.java | 2 +-
.../utils/regression/RegressionModelUtilsTest.java | 13 +-
opennlp-coref/pom.xml | 14 +-
opennlp-dl/pom.xml | 242 +-
.../src/main/java/opennlp/tools/dl/DataReader.java | 26 +-
.../main/java/opennlp/tools/dl/GlobalVectors.java | 41 +-
.../main/java/opennlp/tools/dl/NameFinderDL.java | 32 +-
.../tools/dl/NameSampleDataSetIterator.java | 19 +-
.../main/java/opennlp/tools/dl/NeuralDocCat.java | 35 +-
.../java/opennlp/tools/dl/NeuralDocCatModel.java | 57 +-
.../java/opennlp/tools/dl/NeuralDocCatTrainer.java | 73 +-
opennlp-dl/src/main/java/opennlp/tools/dl/RNN.java | 39 +-
.../src/main/java/opennlp/tools/dl/StackedRNN.java | 52 +-
.../opennlp/tools/dl/UnclosableInputStream.java | 26 +-
.../src/test/java/opennlp/tools/dl/RNNTest.java | 15 +-
.../test/java/opennlp/tools/dl/StackedRNNTest.java | 25 +-
opennlp-similarity/README.txt | 276 +-
opennlp-similarity/RELEASE_NOTES.html | 152 +-
opennlp-similarity/pom.xml | 895 +-
.../multithreaded/BingWebQueryRunnerThread.java | 108 +-
.../apps/contentgen/multithreaded/Fragment.java | 176 +-
.../apps/contentgen/multithreaded/MyEvent.java | 22 +-
.../contentgen/multithreaded/MyEventListener.java | 16 +-
.../contentgen/multithreaded/cgRequestForm.html | 74 +-
.../multithreaded/nlProg2codeRequestForm.html | 94 +-
.../apps/object_dedup/SimilarityAccessorBase.java | 1476 +-
.../apps/relevanceVocabs/PhraseProcessor.java | 464 +-
.../apps/relevanceVocabs/SynonymListFilter.java | 206 +-
.../tools/apps/relevanceVocabs/SynonymMap.java | 704 +-
.../BingAPIProductSearchManager.java | 136 +-
.../review_builder/FBOpenGraphSearchManager.java | 282 +-
.../review_builder/MachineTranslationWrapper.java | 172 +-
.../review_builder/MinedSentenceProcessor.java | 418 +-
.../apps/review_builder/ReviewBuilderRunner.java | 330 +-
.../tools/apps/review_builder/ReviewObj.java | 274 +-
.../review_builder/SentenceBeingOriginalized.java | 118 +-
.../apps/review_builder/SentenceOriginalizer.java | 796 +-
.../URLsWithReviewFinderByProductName.java | 42 +-
.../review_builder/WebPageReviewExtractor.java | 872 +-
.../tools/apps/utils/email/EmailSender.java | 342 +-
.../tools/apps/utils/email/SMTP_Authenticator.java | 48 +-
.../ClassifierTrainingSetIndexer.java | 516 +-
.../java/opennlp/tools/fca/BasicLevelMetrics.java | 1300 +-
.../java/opennlp/tools/fca/ConceptLattice.java | 570 +-
.../main/java/opennlp/tools/fca/FcaConverter.java | 144 +-
.../src/main/java/opennlp/tools/fca/FcaReader.java | 190 +-
.../src/main/java/opennlp/tools/fca/FcaWriter.java | 262 +-
.../main/java/opennlp/tools/fca/FormalConcept.java | 302 +-
.../src/main/java/opennlp/tools/fca/Measures.java | 294 +-
.../opennlp/tools/fca/RandomNoiseGenerator.java | 124 +-
.../jsmlearning/FeatureSpaceCoverageProcessor.java | 630 +-
.../tools/jsmlearning/IntersectionSetBuilder.java | 722 +-
.../tools/jsmlearning/JSMLearnerOnLatticeBase.java | 676 +-
.../JSMLearnerOnLatticeWithAbduction.java | 174 +-
.../JSMLearnerOnLatticeWithDeduction.java | 484 +-
.../tools/jsmlearning/ProfileReaderWriter.java | 326 +-
.../tools/jsmlearning/TreeKernelRunner.java | 256 +-
.../main/java/opennlp/tools/nl2code/NL2Obj.java | 600 +-
.../opennlp/tools/nl2code/NL2ObjCreateAssign.java | 506 +-
.../opennlp/tools/nl2code/ObjectControlOp.java | 118 +-
.../java/opennlp/tools/nl2code/ObjectPhrase.java | 248 +-
.../tools/nl2code/ObjectPhraseListForSentence.java | 206 +-
.../java/opennlp/tools/parse_thicket/ArcType.java | 106 +-
.../opennlp/tools/parse_thicket/IGeneralizer.java | 24 +-
.../opennlp/tools/parse_thicket/ParseTreeNode.java | 472 +-
.../java/opennlp/tools/parse_thicket/Triple.java | 96 +-
.../WordWordInterSentenceRelationArc.java | 136 +-
.../BingQueryRunnerMultipageSearchResults.java | 144 +-
.../parse_thicket/apps/MinedSentenceProcessor.java | 418 +-
.../apps/MostFrequentWordsFromPageGetter.java | 140 +-
.../apps/MultiSentenceSearchResultsProcessor.java | 370 +-
.../parse_thicket/apps/SnippetToParagraph.java | 756 +-
.../apps/WebPageContentSentenceExtractor.java | 294 +-
.../tools/parse_thicket/apps/WebPageExtractor.java | 316 +-
.../CommunicativeActionsArcBuilder.java | 322 +-
.../CommunicativeActionsAttribute.java | 58 +-
.../parse_thicket/matching/LemmaGeneralizer.java | 188 +-
.../matching/NERPhraseGeneralizer.java | 542 +-
.../parse_thicket/matching/PhraseGeneralizer.java | 536 +-
.../matching/PhraseGroupGeneralizer.java | 230 +-
.../LinguisticPatternStructure.java | 388 +-
.../pattern_structure/PatternStructureWriter.java | 116 +-
.../pattern_structure/PhraseConcept.java | 168 +-
.../pattern_structure/PhrasePatternStructure.java | 384 +-
.../tools/similarity/apps/BingQueryRunner.java | 396 +-
.../tools/similarity/apps/BingResponse.java | 204 +-
.../tools/similarity/apps/BingWebQueryRunner.java | 230 +-
.../tools/similarity/apps/ContentGenerator.java | 850 +-
.../similarity/apps/ContentGeneratorRunner.java | 192 +-
.../similarity/apps/ContentGeneratorSupport.java | 984 +-
.../opennlp/tools/similarity/apps/Fragment.java | 194 +-
.../apps/GeneratedSentenceProcessor.java | 630 +-
.../opennlp/tools/similarity/apps/HitBase.java | 520 +-
.../tools/similarity/apps/HitBaseComparable.java | 52 +-
.../similarity/apps/RelatedSentenceFinder.java | 1928 +-
.../similarity/apps/RelatedSentenceFinderML.java | 574 +-
.../similarity/apps/SearchResultsProcessor.java | 226 +-
.../similarity/apps/SentenceTranslate.java.txt | 422 +-
.../apps/SpeechRecognitionResultsProcessor.java | 338 +-
.../similarity/apps/StoryDiscourseNavigator.java | 326 +-
.../apps/WebSearchEngineResultsScraper.java | 516 +-
.../tools/similarity/apps/YahooAnswersMiner.java | 188 +-
.../java/opennlp/tools/similarity/apps/gen.txt | 110 +-
.../tools/similarity/apps/solr/Comment.java | 222 +-
.../tools/similarity/apps/solr/CommentsRel.java | 256 +-
.../apps/solr/ContentGeneratorRequestHandler.java | 482 +-
.../apps/solr/IterativeQueryComponent.java | 374 +-
.../apps/solr/IterativeSearchRequestHandler.java | 678 +-
.../apps/solr/NLProgram2CodeRequestHandler.java | 178 +-
.../apps/solr/QueryExpansionRequestHandler.java | 104 +-
.../solr/SearchResultsReRankerRequestHandler.java | 456 +-
.../apps/solr/SyntGenRequestHandler.java | 646 +-
.../tools/similarity/apps/solr/WordDocBuilder.java | 496 +-
.../apps/solr/WordDocBuilderEndNotes.java | 422 +-
.../solr/WordDocBuilderSingleImageSearchCall.java | 330 +-
.../tools/similarity/apps/solr/cgRequestForm.html | 314 +-
.../similarity/apps/taxo_builder/AriAdapter.java | 186 +-
.../apps/taxo_builder/DomainTaxonomyExtender.java | 458 +-
.../taxo_builder/TaxoQuerySnapshotMatcher.java | 322 +-
.../taxo_builder/TaxonomyExtenderViaMebMining.java | 374 +-
.../apps/taxo_builder/TaxonomySerializer.java | 264 +-
.../similarity/apps/utils/CountItemsList.java | 126 +-
.../tools/similarity/apps/utils/FileHandler.java | 770 +-
.../apps/utils/LevensteinDistanceFinder.java | 290 +-
.../tools/similarity/apps/utils/PageFetcher.java | 304 +-
.../tools/similarity/apps/utils/StringCleaner.java | 58 +-
.../apps/utils/StringDistanceMeasurer.java | 660 +-
.../opennlp/tools/similarity/apps/utils/Utils.java | 1440 +-
.../tools/similarity/apps/utils/ValueSortMap.java | 572 +-
.../main/java/opennlp/tools/stemmer/PStemmer.java | 1034 +-
.../textsimilarity/EpistemicStatesTrainingSet.java | 226 +-
.../textsimilarity/GeneralizationListReducer.java | 300 +-
.../opennlp/tools/textsimilarity/LemmaPair.java | 162 +-
.../opennlp/tools/textsimilarity/POSManager.java | 130 +-
.../tools/textsimilarity/ParseTreeChunk.java | 1140 +-
.../textsimilarity/ParseTreeChunkComparable.java | 64 +-
.../tools/textsimilarity/ParseTreeMatcher.java | 508 +-
.../ParseTreeMatcherDeterministic.java | 550 +-
.../textsimilarity/SentencePairMatchResult.java | 200 +-
.../tools/textsimilarity/TextProcessor.java | 1908 +-
.../textsimilarity/TextSimilarityBagOfWords.java | 1786 +-
.../chunker2matcher/ParserCacheSerializer.java | 296 +-
.../java/opennlp/tools/textsimilarity/readme.txt | 270 +-
.../tools/word2vec/W2VDistanceMeasurer.java | 7 +-
opennlp-similarity/src/main/readme/LICENSE | 458 +-
opennlp-similarity/src/main/readme/NOTICE | 18 +-
.../MultiSentenceSearchResultsProcessorTest.java | 142 +-
.../apps/RelatedSentenceFinderTest.java | 280 +-
.../apps/StoryDiscourseNavigatorTest.java | 78 +-
.../pattern_structure/JSMLearnerOnLatticeTest.java | 616 +-
.../pattern_structure/PhraseTest.java | 338 +-
.../apps/SearchResultsProcessorTest.java | 112 +-
.../apps/taxo_builder/TaxonomyBuildMatchTest.java | 108 +-
.../ParserChunker2MatcherProcessorTest.java | 270 +-
.../chunker2matcher/PhraseNodeTest.java | 120 +-
.../src/test/resources/fca/sports.cxt | 110 +-
.../test/resources/style_recognizer/all-tsne2.txt | 1051 -
.../txt/Bib1/27Bib1Amos_Prophecy_12_EN.txt.txt | 2 -
.../txt/Bib1/28Bib1Amos_Prophecy_89_EN.txt.txt | 2 -
.../txt/Bib1/29Bib1Ezra_History_12_EN.txt.txt | 2 -
.../txt/Bib1/30Bib1Joel_Prophecy_12_EN.txt.txt | 2 -
.../txt/Bib1/31Bib1Ruth_History_12_EN.txt.txt | 2 -
.../txt/Bib2/32Bib2John_Gospel_12_EN.txt.txt | 2 -
.../txt/Bib2/33Bib2Jude_Epistle_1_EN.txt.txt | 2 -
.../txt/Bib2/34Bib2Luke_Acts_12_EN.txt.txt | 2 -
.../txt/Bib2/35Bib2Luke_Acts_2728_EN.txt.txt | 2 -
.../txt/Bib2/36Bib2Luke_Gospel_12_EN.txt.txt | 2 -
.../txt/Bib2/37Bib2Mark_Gospel_12_EN.txt.txt | 2 -
.../txt/Corp/38CorpApple_Environment_EN.txt.txt | 2 -
.../txt/Corp/39CorpHandM_Quality_EN.txt.txt | 2 -
.../txt/Corp/40CorpHandM_Responsibility_EN.txt.txt | 2 -
.../txt/Corp/41CorpHP_Objectives_EN.txt.txt | 2 -
.../Corp/42CorpJaguar_Sustainability_EN.txt.txt | 2 -
.../txt/Corp/43CorpZara_Environment_EN.txt.txt | 2 -
.../txt/Fict/44FictAndersenH_Mermaid_EN.txt.txt | 2 -
.../txt/Fict/45FictAndersenH_Ugly_EN.txt.txt | 2 -
.../txt/Fict/46FictBalzacH_Goriot_Ia_EN.txt.txt | 2 -
.../txt/Fict/47FictBalzacH_Goriot_Ib_EN.txt.txt | 2 -
.../txt/Fict/48FictBronteC_JaneEyre_33_EN.txt.txt | 2 -
.../txt/Fict/49FictBronteC_JaneEyre_6_EN.txt.txt | 2 -
.../Fict/50FictCarrollL_Wonderland_2_EN.txt.txt | 2 -
.../Fict/51FictCarrollL_Wonderland_5_EN.txt.txt | 2 -
.../Fict/52FictDostoyevskyF_CrimePun_ep_EN.txt.txt | 2 -
.../53FictDostoyevskyF_CrimePun_II2_EN.txt.txt | 2 -
.../txt/Fict/54FictDumasAp_3Musk_11_EN.txt.txt | 2 -
.../txt/Fict/55FictDumasAp_3Musk_2_EN.txt.txt | 2 -
.../txt/Fict/56FictFlaubertG_Bovary_I5_EN.txt.txt | 2 -
.../Fict/57FictFlaubertG_Bovary_III3_EN.txt.txt | 2 -
.../Fict/58FictFlaubertG_Salammbo_11_EN.txt.txt | 2 -
.../txt/Fict/59FictFlaubertG_Salammbo_2_EN.txt.txt | 2 -
.../txt/Fict/60FictGrimmJ_Bremusicians_EN.txt.txt | 2 -
.../txt/Fict/61FictGrimmJ_HanselGretel_EN.txt.txt | 2 -
.../txt/Fict/62FictHugoV_Hunchback_II5_EN.txt.txt | 2 -
.../txt/Fict/63FictHugoV_Hunchback_IV3_EN.txt.txt | 2 -
.../txt/Fict/64FictPoeE_Purloined_EN.txt.txt | 2 -
.../txt/Fict/65FictPoeE_Usher_EN.txt.txt | 2 -
.../txt/Fict/66FictTolstoyL_AnnaK_I10_EN.txt.txt | 2 -
.../txt/Fict/67FictTolstoyL_AnnaK_I11_EN.txt.txt | 2 -
.../Fict/68FictTolstoyL_WarPeace_I16_EN.txt.txt | 2 -
.../txt/Fict/69FictTolstoyL_WarPeace_I2_EN.txt.txt | 2 -
.../txt/Fict/70FictWildeO_Dorian_18_EN.txt.txt | 2 -
.../txt/Fict/71FictWildeO_Dorian_8_EN.txt.txt | 2 -
.../txt/Fict/72FictZolaE_Germinal_II4_EN.txt.txt | 2 -
.../txt/Fict/73FictZolaE_Germinal_VII2_EN.txt.txt | 2 -
.../txt/Marx/74MarxMarxK_ComMan_01_EN.txt.txt | 2 -
.../txt/Marx/75MarxMarxK_ComMan_24_EN.txt.txt | 2 -
.../txt/Marx/76MarxMarxK_Feuerbach_EN.txt.txt | 2 -
.../txt/Marx/77MarxMarxK_GothaProg_EN.txt.txt | 2 -
.../txt/Marx/78MarxMarxK_JewishQ_EN.txt.txt | 2 -
...o.uk_international_story_0,,631931,00.html.txt" | 2 -
...ews.bbc.co.uk_2_hi_middle_east_5136988.stm.txt" | 2 -
...ws.bbc.co.uk_2_hi_asia-pacific_2181151.stm.txt" | 2 -
...__news.bbc.co.uk_2_hi_business_2235352.stm.txt" | 2 -
...p:__money.guardian.co.uk_news__0,,,00.html.txt" | 2 -
...dian.co.uk_Match_Report_0,,1536875,00.html.txt" | 2 -
...ws.bbc.co.uk_2_hi_asia-pacific_5133220.stm.txt" | 2 -
...p:__news.bbc.co.uk_2_hi_europe_4263426.stm.txt" | 2 -
...__news.bbc.co.uk_2_hi_business_2769931.stm.txt" | 2 -
...c.co.uk_2_hi_uk_news_education_2191422.stm.txt" | 2 -
...p:__news.bbc.co.uk_2_hi_africa_2909769.stm.txt" | 2 -
...:__news.bbc.co.uk_2_hi_uk_news_2509561.stm.txt" | 2 -
.../txt/News/79NewsEnnajiM_Maghreb_EN.txt.txt | 2 -
.../txt/News/80NewsGoalcom_MessiTop50_EN.txt.txt | 2 -
.../txt/News/81NewsGueyeA_BlackPete_EN.txt.txt | 2 -
.../News/82NewsLeM_OrbanGoldmanSachs_EN.txt.txt | 2 -
...NewsMendesFrancoJ_HaitiBeyondCapital_EN.txt.txt | 2 -
.../84NewsMillerH_FrankensteinTradition_EN.txt.txt | 2 -
.../News/85NewsRabinovichI_IranNuclear_EN.txt.txt | 2 -
.../txt/News/86NewsRian_IranCutsOil_EN.txt.txt | 2 -
.../News/87NewsRian_MedvedevDismisses_EN.txt.txt | 2 -
.../txt/News/88NewsWiki_KaradzicArrest_EN.txt.txt | 2 -
.../txt/Opac/89OpacStallman_FreeSoft_EN.txt.txt | 2 -
.../txt/Opac/90OpacTeam_Berlin_EN.txt.txt | 2 -
.../txt/Opac/91OpacTeam_Budapest_EN.txt.txt | 2 -
.../txt/Tedi/100TediOConnellA_Quantum_EN.txt.txt | 2 -
.../txt/Tedi/101TediRoslingH_Poverty_EN.txt.txt | 2 -
.../Tedi/102TediSinclairC_OpenArchitech_EN.txt.txt | 2 -
.../Tedi/92TediAndersonEt_NuclearEnergy_EN.txt.txt | 2 -
.../txt/Tedi/93TediBelcherA_Batteries_EN.txt.txt | 2 -
.../txt/Tedi/94TediGellMannM_Lang_EN.txt.txt | 2 -
.../txt/Tedi/95TediJakubowskiM_OpenTech_EN.txt.txt | 2 -
.../txt/Tedi/96TediJordanC_ShockStats_EN.txt.txt | 2 -
.../txt/Tedi/97TediMcKeanE_Dict_EN.txt.txt | 2 -
.../txt/Tedi/98TediMillerA_News_EN.txt.txt | 2 -
.../txt/Tedi/99TediNatchweyJ_WarPhotos_EN.txt.txt | 2 -
.../txt/Tele/103TeleHTC_Manual_0_EN.txt.txt | 2 -
.../txt/Tele/104TeleHTC_Manual_10_EN.txt.txt | 2 -
.../txt/Tele/105TeleHTC_Manual_11_EN.txt.txt | 2 -
.../txt/Tele/106TeleHTC_Manual_12_EN.txt.txt | 2 -
.../txt/Tele/107TeleHTC_Manual_13_EN.txt.txt | 2 -
.../txt/Tele/108TeleHTC_Manual_1_EN.txt.txt | 2 -
.../txt/Tele/109TeleHTC_Manual_2_EN.txt.txt | 2 -
.../txt/Tele/110TeleHTC_Manual_3_EN.txt.txt | 2 -
.../txt/Tele/111TeleHTC_Manual_4_EN.txt.txt | 2 -
.../txt/Tele/112TeleHTC_Manual_5_EN.txt.txt | 2 -
.../txt/Tele/113TeleHTC_Manual_6_EN.txt.txt | 2 -
.../txt/Tele/114TeleHTC_Manual_7_EN.txt.txt | 2 -
.../txt/Tele/115TeleHTC_Manual_8_EN.txt.txt | 2 -
.../txt/Tele/116TeleHTC_Manual_9_EN.txt.txt | 2 -
.../txt/Teli/117TeliApple_iPhone4_EN.txt.txt | 2 -
.../txt/Tels/118TelsGoog_Answer_0545_EN.txt.txt | 2 -
.../txt/Tels/119TelsGoog_Answer_0a46_EN.txt.txt | 2 -
.../txt/Tels/120TelsGoog_Answer_0bcf_EN.txt.txt | 2 -
.../txt/Tels/121TelsGoog_Answer_1851_EN.txt.txt | 2 -
.../txt/Tels/122TelsGoog_Answer_1b37_EN.txt.txt | 2 -
.../txt/Tels/123TelsGoog_Answer_2feb_EN.txt.txt | 2 -
.../txt/Tels/124TelsGoog_Answer_3024_EN.txt.txt | 2 -
.../txt/Tels/125TelsGoog_Answer_4b5b_EN.txt.txt | 2 -
.../txt/Tels/126TelsGoog_Answer_596f_EN.txt.txt | 2 -
.../txt/Tels/127TelsGoog_Answer_5b4c_EN.txt.txt | 2 -
.../txt/Tels/128TelsGoog_Answer_70d7_EN.txt.txt | 2 -
.../txt/Tels/129TelsGoog_Answer_770f_EN.txt.txt | 2 -
.../txt/Tels/130TelsGoog_Answer_91e4_EN.txt.txt | 2 -
.../txt/Tels/131TelsGoog_Answer_94d0_EN.txt.txt | 2 -
.../txt/Tels/132TelsGoog_Answer_a67e_EN.txt.txt | 2 -
.../Unit/133UnitGass_Resolution_62250_EN.txt.txt | 2 -
.../txt/Unit/134UnitUnat_Charter_EN.txt.txt | 2 -
.../txt/Unit/135UnitUnat_HumanRights_EN.txt.txt | 2 -
.../txt/Unit/136UnitUnat_StatuteICOJ_EN.txt.txt | 2 -
...37WindParaschivoiuEt_DarrieusTurbine_EN.txt.txt | 2 -
.../txt/Wind/138WindPurohitEt_CDMIndia_EN.txt.txt | 2 -
...9WindRiadhEt_ContrarotatingConverter_EN.txt.txt | 2 -
...bacte\" url=\"http:__vue.org.uk_carlos.htm.txt" | 2 -
...rchived_game.asp?MatchID=89&Season=2002_03.txt" | 2 -
...scathoholidays.co.uk_ShowDetails.asp?id=96.txt" | 2 -
...onenews.org.uk_news_news_detail.asp?nid=22.txt" | 2 -
...\" url=\"http:__www.benhs.org.uk_anex.html.txt" | 2 -
...ion_guides_guides.php?subject=ratsthatbite.txt" | 2 -
...vices_selected_cases_PCA_sc9903_c682b.html.txt" | 2 -
....mml.cam.ac.uk_call_translation_toolkit_6_.txt" | 2 -
....uk_nnr-scotland_news_detail.asp?newsID=79.txt" | 2 -
...x.ac.uk_Conferences_BPCSR05_submission.htm.txt" | 2 -
...24.co.uk_flatfiles_paulpearcetributes.aspx.txt" | 2 -
...ckpresence.co.uk_phpBB2_viewtopic.php?t=97.txt" | 2 -
...viploan.co.uk_article_Mortgages-1212.shtml.txt" | 2 -
...:__www.brainbashers.co.uk_droodlesprev.asp.txt" | 2 -
...hotonics.org.uk_newsletter_NoticeBoard.php.txt" | 2 -
...l=\"http:__www.snh.org.uk_calendar_jul.asp.txt" | 2 -
...obs_Northamptonshire_jobs-in-Brackley.html.txt" | 2 -
..._ultimatefilm_chart_details.php?ranking=65.txt" | 2 -
...mms.co.uk_online_pr_online_pr.ehtml?o=1647.txt" | 2 -
...ackling_human_organ_donation_dilemma_.html.txt" | 2 -
...:__www.sscs.bham.ac.uk_phsi_eating_bmi.htm.txt" | 2 -
...s_selected_cases_HSC_IC0107_pt1-e2242.html.txt" | 2 -
...ce.org.uk_index.asp?contentid=21&menuid=21.txt" | 2 -
...jyhd\" url=\"http:__www.ebe.org.uk_ccn.htm.txt" | 2 -
...orthumberland.gov.uk_vg_text_northpen.html.txt" | 2 -
...rch_reports_1992_theatre_museum_index.html.txt" | 2 -
...eb.easynet.co.uk_jim.shead_River-Arun.html.txt" | 2 -
....lawson-cruttenden.co.uk_conveyancing.html.txt" | 2 -
...hamradio.co.uk_acatalog_Vert_Arno_Ant.html.txt" | 2 -
...ndependent.co.uk_europe_article1192096.ece.txt" | 2 -
...l=\"http:__www.nsbapty.co.uk_Supp-Samp.htm.txt" | 2 -
...x?&cp=.._swt_&cg=_&sim=&id=487&pagetype=27.txt" | 2 -
...http:__www.surf4wine.co.uk_Eben_Sadie.html.txt" | 2 -
...2D08%2D10+09%3A45%3A00&Logo=0&sort=cp&pg=1.txt" | 2 -
...w.ecodyfi.org.uk_commfirstactionplanpr.htm.txt" | 2 -
..." url=\"http:__www.sefton.gov.uk_page&3630.txt" | 2 -
...rspective.org.uk_dwboard_messages_112.html.txt" | 2 -
...dforsale-investment.org.uk_Plot-Sales.html.txt" | 2 -
...tcardirectory.co.uk_car-leasing-jamjar.htm.txt" | 2 -
...rl=\"http:__www.nta.nhs.uk_news_020624.htm.txt" | 2 -
...ity.ac.uk_law_lawpages_Victim_Support.html.txt" | 2 -
...ndustrialnetworking.co.uk_mag_v7-2_p7.html.txt" | 2 -
...ex.php?location=_news_archive_20040628.htm.txt" | 2 -
...ttp:__www.idler.co.uk_archives_?page_id=18.txt" | 2 -
...host.co.uk_support_index.pl?page=mailboxes.txt" | 2 -
...ws_archives_2005_11_backstagebbccou_2.html.txt" | 2 -
...twork.co.uk_Health_default.asp?article=135.txt" | 2 -
...arningexperience.org.uk_learning_first.php.txt" | 2 -
...chortle.co.uk_edfest2006_terrysaunders.htm.txt" | 2 -
....cps.gov.uk_legal_section21_chapter_f.html.txt" | 2 -
...:__www.tropicalfishcentre.co.uk_Plants.htm.txt" | 2 -
...ba.org.uk_bba_jsp_polopoly.jsp?d=155&a=493.txt" | 2 -
...tp:__www.burpham.surrey.sch.uk_potter.html.txt" | 2 -
...goryId=14542&taggingType=4&contentId=11208.txt" | 2 -
...d.co.uk_catalogue_walker_walkerreviews.htm.txt" | 2 -
...ripreports_Spain_andalucia6_and-oct-03.htm.txt" | 2 -
...gservicesindex.co.uk_newsletter_aug04.html.txt" | 2 -
...ndex.cfm?fuseaction=details&nNewsID=560539.txt" | 2 -
...o.uk_artists_artistspage.php?ID=204&page=3.txt" | 2 -
...ewire.co.uk_buying-property-continent.html.txt" | 2 -
...ion.co.uk_usability_articles_print_wud.asp.txt" | 2 -
...cabi_3736cbd2e5895cf49854f8d70494bae7.html.txt" | 2 -
...lsham.pwp.blueyonder.co.uk_cx500_oil_pump_.txt" | 2 -
...uk_index.php?name=News&file=article&sid=34.txt" | 2 -
...tel.org.uk_scgn_articles_9902_inbrief.html.txt" | 2 -
...side.gov.uk_tmbc6_cycling_withoutmycar.htm.txt" | 2 -
...f_Personal_pages_Ifan1_Booth_Notebooks.htm.txt" | 2 -
...ticle_3603_reduce-cancer-reoccurrence.html.txt" | 2 -
...eaddiscovery.co.uk_job.aspx?jid=11535&cd=1.txt" | 2 -
...:__www.syscom.plc.uk_solutions_distrib.asp.txt" | 2 -
...splay.jsp?section=Banking&article_id=64923.txt" | 2 -
....evolutec.co.uk_06_chairman.asp?thesub=6.0.txt" | 2 -
...www.truststfc.co.uk_meeting_27_09_2006.php.txt" | 2 -
...ansition_personal_experiences_michael.html.txt" | 2 -
...ary_library_history_library_history_3.html.txt" | 2 -
...cialistunitynetwork.co.uk_news_g8jepps.htm.txt" | 2 -
...ttp:__www.weirdwiltshire.co.uk_250703.html.txt" | 2 -
...y-midwifery_lsa-guidelines_maternal-deaths.txt" | 2 -
...kin+Ltd&frmBPE=&frmCD=N&mopt=dpe&dpid=2302.txt" | 2 -
...el\" url=\"http:__www.siba.co.uk_about.asp.txt" | 2 -
...s_Wave_Nirvana_2_Mizuno_Running_Shoes.html.txt" | 2 -
...research.org.uk_?lid=1944&tmpl=ddmainprint.txt" | 2 -
...uk_departments_services_campusenvironment_.txt" | 2 -
...e_details.asp?ED=Arts+and+Crafts&offset=66.txt" | 2 -
...vert_DBID_17ea4c66d7bd2c0aeb4513c89cb01afd.txt" | 2 -
...www.fst.rdg.ac.uk_news-archive-2004-11.htm.txt" | 2 -
...p:__www.aslib.co.uk_training_careers_9.htm.txt" | 2 -
...06_profile_Can-I-spend-time-on-an-elective.txt" | 2 -
....incomesdata.co.uk_europe_duediligence.htm.txt" | 2 -
....pennine.demon.co.uk_NPC_1982_MEXICOSP.HTM.txt" | 2 -
...http:__www.hsl.gov.uk_publications_car.htm.txt" | 2 -
..._www.baronage.co.uk_bphtm-01_const-02.html.txt" | 2 -
...55D14C83960FBA06562FFBA3B67013B5558FE96AD7.txt" | 2 -
...ww.myleedsjobs.co.uk_jobdetails-11834.html.txt" | 2 -
...http:__www.paperairplanes.co.uk_orplan.php.txt" | 2 -
...rl=\"http:__www.eca.ac.uk_tacitus_news.htm.txt" | 2 -
...ww.casino-avenue.co.uk_2004_06_duuuuh.html.txt" | 2 -
...ov.uk_lifeevent_penret_penreform_5_reg.asp.txt" | 2 -
...ramearch.co.uk_projects_T5_excavation.html.txt" | 2 -
...__www.redcross.org.uk_section.asp?id=49633.txt" | 2 -
...stforum.org.uk_jobs_forestsmonitor2001.htm.txt" | 2 -
...useum.org.uk_kids_detail.asp?ContentID=189.txt" | 2 -
...ffthetelly.co.uk_interviews_markwright.htm.txt" | 2 -
...tp:__www.sitcom.co.uk_tlc_characters.shtml.txt" | 2 -
...-grampian.co.uk_whiskycountry_ess_walk.htm.txt" | 2 -
...enparty.org.uk_sgpnewsarticle20051222a.htm.txt" | 2 -
....employment-solicitors.co.uk_Employer1.htm.txt" | 2 -
....co.uk_news_Food_Sounds_So_Good_at_DArcys_.txt" | 2 -
...\"http:__www.sweetsforu.co.uk_shipping.php.txt" | 2 -
...e.org.uk_Listings.aspx?index=387&item=2929.txt" | 2 -
....co.uk_product.aspx?catno=53&prod=HCAA6241.txt" | 2 -
....co.uk_main_en_att-provider-ROMA_6913.html.txt" | 2 -
...w.art-works.org.uk_artworks_z030703b.shtml.txt" | 2 -
...ndolier_booth_miscellaneous_wristgang.html.txt" | 2 -
..._www.changingdiabetes.co.uk_view.asp?ID=92.txt" | 2 -
...elmets.co.uk_las%20new%20bionix%20page.htm.txt" | 2 -
...age=37&sql=&sortup=sorttitle&bookstatus=OK.txt" | 2 -
...st.org.uk_cheshire_proj_harvest_survey.htm.txt" | 2 -
....enemydown.co.uk_clancomments.php?id=35113.txt" | 2 -
...http:__www.scis.org.uk_search_menu_new.asp.txt" | 2 -
...clickbankmembership_clickbankprotector.htm.txt" | 2 -
...w.blewa.co.uk_project5_teachers_T5-0-1.htm.txt" | 2 -
..._index.php?category=campaigns&c=i&uid=2130.txt" | 2 -
...__www.kent-ccc.co.uk_news_story.php?id=660.txt" | 2 -
...ault.asp?WCI=SiteHome&ID=9908&PageID=56638.txt" | 2 -
...o.uk_jsp_id_0340894342_Divine_Madness.html.txt" | 2 -
...ttp:__www.newble.co.uk_chalmers_innes.html.txt" | 2 -
...www.searchenginespy.co.uk_article0027.html.txt" | 2 -
...corpus_search_document.php?documentid=1211.txt" | 2 -
...amilyheritage_forum_topic.asp?TOPIC_ID=26&.txt" | 2 -
...rtyandhousesforsalelimousinabn0509263.html.txt" | 2 -
...rvicedevelopment_managerialfacilities.aspx.txt" | 2 -
..._safety_various_rass_kmweb_safety_msds.htm.txt" | 2 -
...itain.co.uk_index.php?id=23&L=3&article=13.txt" | 2 -
..._strAreaNo=1053,2011&strKeyword=PS2006_4_3.txt" | 2 -
..."http:__www.itreviews.co.uk_games_g232.htm.txt" | 2 -
...on.co.uk_2002_09_to-quote-the-four-seasons.txt" | 2 -
...fault.aspx?group_id=16538&article_id=21979.txt" | 2 -
...esearch_staff_jpf_papers_paper26_index.php.txt" | 2 -
...p:__www.all-energy.co.uk_newsletter45.html.txt" | 2 -
...tworker.org.uk_article.php?article_id=8138.txt" | 2 -
...www.setdanceteacher.co.uk_newmarketmez.htm.txt" | 2 -
....uk_interpro_DisplayIproEntry?ac=IPR002824.txt" | 2 -
...:__www.garthyfog.co.uk_mawddach_valley.htm.txt" | 2 -
...k_caving_expeditions_jura05_jura_circ1.php.txt" | 2 -
....oca-online.co.uk_viewnews.cfm?news_id=177.txt" | 2 -
...ustomPage.aspx?PageID=24163&sectionID=4585.txt" | 2 -
...usnews_news_search.php?search=&start=12080.txt" | 2 -
...ww.linc4info.org.uk_cms_pages_sitemap.html.txt" | 2 -
...www.ccp4.ac.uk_courses_IUCr2005_index.html.txt" | 2 -
...ptive-engineering.co.uk_html_training.html.txt" | 2 -
...bc\" url=\"http:__www.lanpac.co.uk_csi.php.txt" | 2 -
...le.org.uk_html_files_501_project_info.html.txt" | 2 -
...ures.co.uk_showpage.asp?showdocumentid=196.txt" | 2 -
....rl.ac.uk_star_docs_sun232.htx_node17.html.txt" | 2 -
...900_cmhansrd_vo000405_debtext_00405-07.htm.txt" | 2 -
...20PRESBYTERY%20OF%20PENPONT%20p.%20672.htm.txt" | 2 -
..._www.wessingtoncryogenics.co.uk_serv01.htm.txt" | 2 -
...vdc_content_index.jsp?contentid=1999276669.txt" | 2 -
...w.stratford-upon-avon.co.uk_static_481.htm.txt" | 2 -
...rgygroup.co.uk_office-support-recruitment_.txt" | 2 -
..._catalog_product_info.php?products_id=2981.txt" | 2 -
....uk_fourwheels_formula1_article.asp?a=1327.txt" | 2 -
...david_docs_api_javax_swing_JSplitPane.html.txt" | 2 -
...ateonline.co.uk_60_66_67_articles_7335.php.txt" | 2 -
...__www.iae.co.uk_news_designedforthejob.htm.txt" | 2 -
...rg.uk_Case_Studies_studies_Ford3_Ford3.asp.txt" | 2 -
...tcoffee.co.uk_product.php?xProd=21&xSec=22.txt" | 2 -
...uk_usability_aboutus_usability_aboutus.asp.txt" | 2 -
...orld_story.asp?latestchapter=12&subarea=11.txt" | 2 -
...rratt.co.uk_pages_searchdetails.asp?ID=776.txt" | 2 -
...lthforum.org.uk_userpage1.cfm?item_id=1913.txt" | 2 -
...w.schoolhouse.org.uk_law_not_enrolled.html.txt" | 2 -
..._calendar_archive_article.cfm?articleId=52.txt" | 2 -
..."http:__www.lathes.co.uk_beaver_page5.html.txt" | 2 -
...__www.hasslefreeminiatures.co.uk_rules.php.txt" | 2 -
...g.uk_modules_event_viewevent.php?eveid=109.txt" | 2 -
...ube-cheats_Gamecube-(hardware)-Cheats.html.txt" | 2 -
...:__www.omega.co.uk_ppt_pptsc.asp?ref=LE902.txt" | 2 -
..._forum_poster.cfm?sort=creatasc&poster=101.txt" | 2 -
...org.uk_directory_prof_issues_blreview.html.txt" | 2 -
...rged_to_back_london's_olympic_2012_bid.htm.txt" | 2 -
...?forum=106&thread=9757638&message=11724737.txt" | 2 -
...10051_20553_100_10012_10010_category_10010.txt" | 2 -
...jhc.co.uk_news_industry_2005_ind505016.htm.txt" | 2 -
...ww.uea.ac.uk_eas_events_litfestspr04.shtml.txt" | 2 -
...w.kimberry.co.uk_Dotnetlectures_Index.aspx.txt" | 2 -
...www.lathes.co.uk_wolfjahnmiller_page2.html.txt" | 2 -
..._site_cms_newsarticleview.asp?article=2173.txt" | 2 -
...\"http:__www.anweb.co.uk_l_04_c3_c3a10.htm.txt" | 2 -
...nt_subject_modernlanguages_course_s1s2.htm.txt" | 2 -
...http:__www.law.warwick.ac.uk_ltj_4-1m.html.txt" | 2 -
...zenshipfoundation.org.uk_main_news.php?n20.txt" | 2 -
...\"http:__www.arnside-online.co.uk_care.htm.txt" | 2 -
...rsport.co.uk_products_leatherman_micra.php.txt" | 2 -
....org.uk_columnists_docdiary2.php?docId=103.txt" | 2 -
...nline.co.uk_article_articleview_1733_1_153.txt" | 2 -
...ird-survey.pwp.blueyonder.co.uk_P_mugo.htm.txt" | 2 -
...www.free-internet.co.uk_email_sendmail.htm.txt" | 2 -
...k_resources_ums_PythonDoc_api_threads.html.txt" | 2 -
...html?in_article_id=405873&in_page_id=50002.txt" | 2 -
...gservices.gcal.ac.uk_synergy_03_scwbl.html.txt" | 2 -
...les_BF_NEWSART_view.asp?Q=BF_NEWSART_95582.txt" | 2 -
...oftware.co.uk_printpage.asp?REF=_group.asp.txt" | 2 -
...tp:__www.dba.org.uk_aboutdba_chriswood.asp.txt" | 2 -
...k_culture_books_0804_110804_food_books.htm.txt" | 2 -
...p:__www.newtsnni.gov.uk_actionplan_04b.htm.txt" | 2 -
...ICT_KS3_databases_relational_databases.htm.txt" | 2 -
...erton_pages_SchemesofWork_KS4_skillswl.htm.txt" | 2 -
...r-men_unusual-gadgets_mood-light-tile.html.txt" | 2 -
...rticle&sid=175&mode=thread&order=0&thold=0.txt" | 2 -
...l=\"http:__www.engender.org.uk_justice.htm.txt" | 2 -
...ttp:__www.heros.org.uk_home_sub.asp?page=2.txt" | 2 -
...g.org.uk_clinical_prac_mar_05_mar05_08.htm.txt" | 2 -
...__www.cdp.bham.ac.uk_About_CDP_methods.htm.txt" | 2 -
...o.uk_caminfo_blueprint_articles.asp?ID=807.txt" | 2 -
...legislation_scotland_acts2002_20017--b.htm.txt" | 2 -
...ictures.co.uk_dog-pictures_shiba_inu.shtml.txt" | 2 -
...trawbale-building.co.uk_index.php?page=faq.txt" | 2 -
...er.co.uk_londonunderuk_tfl_our_careers.asp.txt" | 2 -
...:__www.environment.bham.ac.uk_extindex.htm.txt" | 2 -
...xhibitions_Aug%2006%2004_James%20Cauty.htm.txt" | 2 -
...tp:__www.sincuser.f9.co.uk_050_lastwrd.htm.txt" | 2 -
...tp:__www.ocdaction.org.uk_skin-picking.htm.txt" | 2 -
...l=\"http:__www.greenparty.org.uk_news_2033.txt" | 2 -
...el.ed.ac.uk_linguist_issues_17_17-229.html.txt" | 2 -
...news_aRelease.asp?akey=2026&Mon=01_07_2004.txt" | 2 -
..." url=\"http:__www.lpt.nhs.uk_service5.php.txt" | 2 -
...org.uk_resources_reportdetails.asp?id=1039.txt" | 2 -
....arctech.co.uk_siemens_hosted_exchange.htm.txt" | 2 -
...g.uk_archives_2006_01_chomsky_intervi.html.txt" | 2 -
.../synd/0syndicate_bmw-s-and-chinese-justice.txt | 2 -
.../synd/10syndicate_france-s-fourth-moment.txt | 2 -
...-wrong-idea-of-france-by-brigitte-granville.txt | 2 -
.../12syndicate_hollywood-s-favorite-villains.txt | 2 -
...icate_japanese-lessons-for-china-s-currency.txt | 2 -
...terrence-from-cuba-to-iran-by-joseph-s--nye.txt | 2 -
...15syndicate_merkel-in-china-by-sanjaya-baru.txt | 2 -
.../16syndicate_ms--europe-or-frau-germania-.txt | 2 -
...-supply-chain-by-andrew-sheng-and-geng-xiao.txt | 2 -
...icate_russia-s-ukrainian-path-to-the-future.txt | 2 -
...uld-europe-regulate-sovereign-wealth-funds-.txt | 2 -
...1syndicate_china-and-a-new-balance-of-power.txt | 2 -
...dicate_the--browning--of-african-technology.txt | 2 -
.../txt/synd/21syndicate_the-china-question.txt | 2 -
...yndicate_the-end-of-the-russia-china-debate.txt | 2 -
...ndicate_the-making-of-china-s-trade-deficit.txt | 2 -
...cate_the-return-of-franco-german-leadership.txt | 2 -
.../synd/25syndicate_the-transatlantic-index.txt | 2 -
.../26syndicate_will-russia-save-the-west-.txt | 2 -
..._china-and-russia-in-the-new-world-disorder.txt | 2 -
...na-japan-protests-islands-by-liah-greenfeld.txt | 2 -
.../txt/synd/4syndicate_china-s-cyber-warriors.txt | 2 -
.../txt/synd/5syndicate_china-s-gift-to-europe.txt | 2 -
.../synd/6syndicate_china-s-threat-to-russia.txt | 2 -
...pe-s-vital-french-connection-by-kemal-dervi.txt | 2 -
.../txt/synd/8syndicate_exchange-rate-disorder.txt | 2 -
...ndicate_france-and-germany-must-act-in-iraq.txt | 2 -
...140ted_a_j_jacobs_year_of_living_biblically.txt | 2 -
...alan_kay_shares_a_powerful_idea_about_ideas.txt | 2 -
...2ted_alex_tabarrok_foresees_economic_growth.txt | 2 -
.../txt/ted/143ted_amy_tan_on_creativity.txt | 2 -
...ted_barry_schwartz_on_the_paradox_of_choice.txt | 2 -
..._benjamin_wallace_on_the_price_of_happiness.txt | 2 -
.../146ted_bono_s_call_to_action_for_africa.txt | 2 -
.../147ted_dan_dennett_cute_sexy_sweet_funny.txt | 2 -
...invents_a_better_way_to_harvest_bone_marrow.txt | 2 -
...makes_his_ted_prize_wish_once_upon_a_school.txt | 2 -
.../150ted_don_norman_on_design_and_emotion.txt | 2 -
...ns_goodwin_on_learning_from_past_presidents.txt | 2 -
...ed_elliot_krane_the_mystery_of_chronic_pain.txt | 2 -
...eva_zeisel_on_the_playful_search_for_beauty.txt | 2 -
...d_ex_moonie_diane_benscoter_how_cults_think.txt | 2 -
.../txt/ted/155ted_hans_rosling_at_state.txt | 2 -
...ted_helen_fisher_tells_us_why_we_love_cheat.txt | 2 -
...57ted_isabel_allende_tells_tales_of_passion.txt | 2 -
.../158ted_jessi_arrington_wearing_nothing_new.txt | 2 -
...n_underkoffler_drive_3d_data_with_a_gesture.txt | 2 -
...ed_joseph_lekuton_tells_a_parable_for_kenya.txt | 2 -
.../txt/ted/161ted_julia_sweeney_has_the_talk.txt | 2 -
...d_ken_robinson_says_schools_kill_creativity.txt | 2 -
.../txt/ted/163ted_marcin_jakubowski.txt | 2 -
...oach_10_things_you_didn_t_know_about_orgasm.txt | 2 -
...el_sandel_the_lost_art_of_democratic_debate.txt | 2 -
...michael_shermer_on_believing_strange_things.txt | 2 -
...a_glenny_investigates_global_crime_networks.txt | 2 -
..._what_hallucination_reveals_about_our_minds.txt | 2 -
...ebecca_saxe_how_brains_make_moral_judgments.txt | 2 -
.../ted/170ted_robert_thurman_on_compassion.txt | 2 -
...rory_sutherland_life_lessons_from_an_ad_man.txt | 2 -
...2ted_sean_gourley_on_the_mathematics_of_war.txt | 2 -
...hows_how_he_found_the_true_face_of_leonardo.txt | 2 -
...en_wolfram_computing_a_theory_of_everything.txt | 2 -
.../txt/ted/175ted_tom_wujec_build_a_tower.txt | 2 -
...m_wujec_on_3_ways_the_brain_creates_meaning.txt | 2 -
.../style_recognizer/txt/ted/177ted_william_li.txt | 2 -
...company-wizard.co.uk_SEO_Link-Exchange.htm.txt" | 2 -
...ip.org.uk_newspub_story.cfm?id=353&sid=123.txt" | 2 -
...aringconcern.org.uk_news_news_scots06.html.txt" | 2 -
...ogy_in_the_Community_Joan_Wolstenholme.htm.txt" | 2 -
...ault.asp?WCI=SiteHome&ID=4337&PageID=21591.txt" | 2 -
...galha.freeserve.co.uk_glh_233_mckenna.html.txt" | 2 -
.../txt/un/A/178un_A_AC252_L13.txt | 2 -
.../txt/un/A/179un_A_C3_61_L17.txt | 2 -
.../txt/un/A/180un_APLC_MSP2_2000_1.txt | 2 -
.../txt/un/C/181un_CCW_APII_CONF4_SR2.txt | 2 -
.../style_recognizer/txt/un/C/182un_CD_1605.txt | 2 -
.../style_recognizer/txt/un/C/183un_CD_1606.txt | 2 -
.../style_recognizer/txt/un/C/184un_CD_1672.txt | 2 -
.../style_recognizer/txt/un/C/185un_CD_PV1080.txt | 2 -
.../style_recognizer/txt/un/C/186un_CD_PV1157.txt | 2 -
.../style_recognizer/txt/un/C/187un_CD_PV857.txt | 2 -
.../style_recognizer/txt/un/C/188un_CD_PV861.txt | 2 -
.../txt/un/C/189un_CEDAW_C_2002_II_3_ADD2.txt | 2 -
.../txt/un/C/190un_CES_SEM52_2.txt | 2 -
.../txt/un/C/191un_CES_SEM52_3.txt | 2 -
.../style_recognizer/txt/un/C/192un_CLCS_34.txt | 2 -
.../txt/un/C/193un_CRC_GC_2003_4.txt | 2 -
.../style_recognizer/txt/un/D/194un_DP_2002_34.txt | 2 -
.../txt/un/E/195un_E_C16_2002_2.txt | 2 -
.../txt/un/E/196un_E_CN17_2002_PC2_19.txt | 2 -
.../txt/un/E/197un_E_CN3_2003_25.txt | 2 -
.../txt/un/E/198un_E_CN4_2003_G_12.txt | 2 -
.../txt/un/E/199un_E_CN4_2004_G_21.txt | 2 -
.../txt/un/F/200un_FCCC_SBI_2002_15.txt | 2 -
.../txt/un/F/201un_FCCC_SBI_2002_9.txt | 2 -
.../txt/un/F/202un_FCCC_SBI_2004_L27.txt | 2 -
.../txt/un/H/203un_HRI_CORE_1_ADD117.txt | 2 -
.../txt/un/H/204un_HRI_CORE_1_ADD123.txt | 2 -
.../txt/un/H/205un_HSP_GC_19_2_ADD2.txt | 2 -
.../style_recognizer/txt/un/I/206un_IDB25_6.txt | 2 -
.../style_recognizer/txt/un/I/207un_IDB35_13.txt | 2 -
.../style_recognizer/txt/un/I/208un_ISBA_8_A_1.txt | 2 -
.../txt/un/N/209un_NPT_CONF2005_PCI_10.txt | 2 -
.../txt/un/P/210un_PBC24_1_ADD1.txt | 2 -
.../txt/un/P/211un_PBC24_4-IDB35_4.txt | 2 -
.../txt/un/P/212un_PBC_2_SLE_9.txt | 2 -
.../txt/un/P/213un_PCNICC_2000_1_ADD1.txt | 2 -
.../txt/un/P/214un_PCNICC_2001_WGAPIC_L1.txt | 2 -
.../style_recognizer/txt/un/S/215un_S_2000_475.txt | 2 -
.../style_recognizer/txt/un/S/216un_S_2000_817.txt | 2 -
.../txt/un/S/217un_S_2001_1038-A_56_521.txt | 2 -
.../txt/un/S/218un_S_2001_1039.txt | 2 -
.../txt/un/S/219un_S_2001_1317.txt | 2 -
.../txt/un/S/220un_S_2001_70-A_55_740.txt | 2 -
.../style_recognizer/txt/un/S/221un_S_2001_947.txt | 2 -
.../txt/un/S/222un_S_2002_1141.txt | 2 -
.../txt/un/S/223un_S_2002_1180.txt | 2 -
.../txt/un/S/224un_S_2002_238-A_56_858.txt | 2 -
.../txt/un/S/225un_S_2002_313-A_56_888.txt | 2 -
.../txt/un/S/226un_S_2002_573-A_56_960.txt | 2 -
.../txt/un/S/227un_S_2003_326-A_ES-10_222.txt | 2 -
.../style_recognizer/txt/un/S/228un_S_2006_490.txt | 2 -
.../txt/un/S/229un_S_2009_208-A_63_820.txt | 2 -
.../txt/un/S/230un_SAICM_ICCM2_INF_18.txt | 2 -
.../style_recognizer/txt/un/S/231un_S_PV4596.txt | 2 -
.../style_recognizer/txt/un/S/232un_S_PV4646.txt | 2 -
.../txt/un/S/233un_S_PV4684RESUMPTION1.txt | 2 -
.../style_recognizer/txt/un/S/234un_S_PV4736.txt | 2 -
.../style_recognizer/txt/un/S/235un_S_PV4903.txt | 2 -
.../style_recognizer/txt/un/S/236un_S_PV4944.txt | 2 -
.../style_recognizer/txt/un/S/237un_S_PV5627.txt | 2 -
.../txt/un/S/238un_ST_SGB_2002_9.txt | 2 -
.../style_recognizer/txt/un/T/239un_TD_B_49_11.txt | 2 -
.../txt/un/T/240un_TD_B_49_SC2_L1.txt | 2 -
.../txt/un/T/241un_TD_B_COM3_54.txt | 2 -
.../txt/un/T/242un_TD_B_EX28_L1.txt | 2 -
.../txt/un/T/243un_TESTGVADUTY001.txt | 2 -
.../txt/un/U/244un_UNEP_GC_22_8_ADD2.txt | 2 -
.../txt/un/U/245un_UNEP_GC_24_2.txt | 2 -
.../txt/un/U/246un_UNEP_POPS_INC6_22.txt | 2 -
...stir.ac.uk_sppa_sppa_responsibilities.html.txt" | 2 -
...customer_terms_index.omp?cid=1146151223400.txt" | 2 -
...uk_Cmach_Backissues_j005_Articles_hall.htm.txt" | 2 -
...o.uk_archives_2006_06_met_chief_could.html.txt" | 2 -
...ttp:__www.fenews.co.uk_newsview.asp?n=1014.txt" | 2 -
...the_north_east_petscorner_news_140106.html.txt" | 2 -
..."http:__www.nursingbra.co.uk_emma_jane.htm.txt" | 2 -
...ive_care_worcestershire_easemore_road.html.txt" | 2 -
...o.uk_comedy_comedians_comedian.aspx?id=429.txt" | 2 -
...\"http:__www.seequality.org.uk_gender.html.txt" | 2 -
.../src/test/resources/taxonomies/irs_dom.ari | 3074 +-
.../src/test/resources/taxonomies/taxo_English.xml | 230202 +++++++++---------
.../resources/tree_kernel/action-plan-doc-list.csv | 119 -
.../src/test/resources/tree_kernel/svm.run.mac.zip | Bin 90804 -> 0 bytes
.../src/test/resources/tree_kernel/svm_classify | Bin 257356 -> 0 bytes
.../test/resources/tree_kernel/svm_classify.exe | Bin 136343 -> 0 bytes
.../test/resources/tree_kernel/svm_classify.linux | Bin 275767 -> 0 bytes
.../src/test/resources/tree_kernel/svm_learn | Bin 336068 -> 0 bytes
.../src/test/resources/tree_kernel/svm_learn.exe | Bin 147778 -> 0 bytes
.../tree_kernel/training_pos_neg_sentiment.txt | 15930 --
.../src/test/resources/tree_kernel/tree_kernel.zip | Bin 89535 -> 0 bytes
opennlp-wsd/pom.xml | 12 +-
.../DisambiguatorEvaluatorParams.java | 82 +-
.../disambiguator/DisambiguatorEvaluatorTool.java | 190 +-
.../cmdline/disambiguator/DisambiguatorTool.java | 274 +-
.../disambiguator/DisambiguatorToolParams.java | 82 +-
.../disambiguator/IMSWSDContextGenerator.java | 326 +-
.../disambiguator/IMSWSDSequenceValidator.java | 100 +-
.../main/java/opennlp/tools/disambiguator/MFS.java | 306 +-
.../disambiguator/OSCCWSDContextGenerator.java | 224 +-
.../tools/disambiguator/WSDContextGenerator.java | 68 +-
.../opennlp/tools/disambiguator/WSDHelper.java | 1386 +-
.../java/opennlp/tools/disambiguator/WSDModel.java | 308 +-
.../opennlp/tools/disambiguator/WSDSample.java | 452 +-
.../tools/disambiguator/WSDSampleStream.java | 156 +-
.../disambiguator/WSDisambiguatorFactory.java | 122 +-
.../tools/disambiguator/datareader/Paragraph.java | 194 +-
.../datareader/SemcorReaderExtended.java | 684 +-
.../disambiguator/datareader/SensevalReader.java | 610 +-
.../tools/disambiguator/datareader/Sentence.java | 174 +-
.../tools/disambiguator/datareader/Word.java | 598 +-
.../tools/disambiguator/MFSEvaluatorTest.java | 130 +-
.../opennlp/tools/disambiguator/MFSTester.java | 262 +-
pom.xml | 475 +
corpus-server-impl/feature.xml => rat-excludes | 21 +-
summarizer/pom.xml | 46 +-
.../main/java/opennlp/summarization/Sentence.java | 4 +-
.../lexicalchaining/LexicalChain.java | 3 +-
.../lexicalchaining/LexicalChainingSummarizer.java | 4 +-
.../WordRelationshipDetermination.java | 13 +-
.../preprocess/DefaultDocProcessor.java | 5 +-
.../opennlp/summarization/textrank/TextRank.java | 2 +-
summarizer/src/test/resources/wordnet/LICENSE | 31 -
summarizer/src/test/resources/wordnet/README | 101 -
summarizer/src/test/resources/wordnet/dict/adj.exc | 1490 -
summarizer/src/test/resources/wordnet/dict/adv.exc | 7 -
.../src/test/resources/wordnet/dict/data.adj | 18185 --
.../src/test/resources/wordnet/dict/data.adv | 3650 -
.../src/test/resources/wordnet/dict/data.noun | 82144 -------
.../src/test/resources/wordnet/dict/data.verb | 13796 --
.../src/test/resources/wordnet/dict/frames.vrb | 35 -
.../src/test/resources/wordnet/dict/index.adj | 21508 --
.../src/test/resources/wordnet/dict/index.adv | 4510 -
.../src/test/resources/wordnet/dict/index.noun | 117827 ---------
.../src/test/resources/wordnet/dict/index.sense | 206941 ----------------
.../src/test/resources/wordnet/dict/index.verb | 11558 -
.../src/test/resources/wordnet/dict/lexnames | 45 -
.../src/test/resources/wordnet/dict/noun.exc | 2054 -
.../src/test/resources/wordnet/dict/sentidx.vrb | 3421 -
.../src/test/resources/wordnet/dict/sents.vrb | 170 -
.../test/resources/wordnet/dict/verb.Framestext | 35 -
.../src/test/resources/wordnet/dict/verb.exc | 2401 -
tagging-server/pom.xml | 25 +-
tf-ner-poc/pom.xml | 9 +-
wikinews-importer/pom.xml | 9 +-
852 files changed, 150690 insertions(+), 657622 deletions(-)
create mode 100644 .gitattributes
create mode 100644 .github/CONTRIBUTING.md
create mode 100644 .github/PULL_REQUEST_TEMPLATE.md
create mode 100644 .github/workflows/maven.yml
create mode 100644 checkstyle.xml
delete mode 100644
corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector/CSCasConsumerTest.java
delete mode 100644
corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector/CSCollectionReaderTest.java
delete mode 100644 corpus-server-impl/pom.xml
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/CSCasWriter.xml (97%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/CSQueueCollectionReader.xml (97%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/EngPersonNameFinderTrainerCPE.xml
(100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/EngTokenizerAndSentdetectCPE.xml
(100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/PersonNameFinderTrainer.xml (100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/SentenceDetector.xml (100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/Tokenizer.xml (100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/desc/TokenizerAndSentdetectAAE.xml (100%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/pom.xml (63%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/src/main/java/org/apache/opennlp/corpus_server/connector/CSCasWriter.java
(96%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/src/main/java/org/apache/opennlp/corpus_server/connector/CSQueueCollectionReader.java
(99%)
rename {corpus-server-connector =>
corpus-server/corpus-server-connector}/src/main/java/org/apache/opennlp/corpus_server/connector/UimaUtil.java
(97%)
copy tf-ner-poc/src/main/java/org/apache/opennlp/ModelUtil.java =>
corpus-server/corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector/AbstractCSTest.java
(53%)
create mode 100644
corpus-server/corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector/CSCasWriterTest.java
create mode 100644
corpus-server/corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector/CSCollectionReaderTest.java
copy corpus-server/{src/test/java/org/apache/opennlp/corpus_server/util =>
corpus-server-connector/src/test/java/org/apache/opennlp/corpus_server/connector}/TestCorpusServer.java
(90%)
rename
corpus-server-connector/src/test/resources/org/apache/opennlp/corpus_server/connector/CSCasConsumerDescriptor.xml
=>
corpus-server/corpus-server-connector/src/test/resources/CSCasConsumerTestDescriptor.xml
(99%)
rename
corpus-server-connector/src/test/resources/org/apache/opennlp/corpus_server/connector/CSCollectionReaderDescriptor.xml
=>
corpus-server/corpus-server-connector/src/test/resources/CSCollectionReaderTestDescriptor.xml
(97%)
copy
{corpus-server-impl/src/main/resources/org/apache/opennlp/corpus_server/impl =>
corpus-server/corpus-server-connector/src/test/resources}/TypeSystem.xml (100%)
rename corpus-server/{ => corpus-server-core}/feature.xml (94%)
create mode 100644 corpus-server/corpus-server-core/pom.xml
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/CorporaResource.java
(92%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/CorpusResource.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/CorpusServer.java
(89%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/CorpusServerApplication.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/CorpusServerBundle.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/TaskQueueResource.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/TaskQueuesResource.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/search/SearchService.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/AbstractCorporaStore.java
(94%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/CorporaChangeListener.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/CorporaStore.java
(86%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/CorpusStore.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/MemoryCorporaStore.java
(93%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/store/MemoryCorpusStore.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/taskqueue/MemoryTaskQueue.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/taskqueue/MemoryTaskQueueService.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/taskqueue/TaskQueue.java
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/java/org/apache/opennlp/corpus_server/taskqueue/TaskQueueService.java
(100%)
rename
{corpus-server-impl/src/main/resources/org/apache/opennlp/corpus_server/impl =>
corpus-server/corpus-server-core/src/main/resources/org/apache/opennlp/corpus_server/search}/IndexWriter.properties
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/resources/org/apache/opennlp/corpus_server/search/LuceneIndexer.xml
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/main/resources/org/apache/opennlp/corpus_server/search/TypeSystem.xml
(100%)
rename corpus-server/{ => corpus-server-core}/src/main/webapp/WEB-INF/web.xml
(100%)
rename corpus-server/{ =>
corpus-server-core}/src/test/java/org/apache/opennlp/corpus_server/util/TestCorpusServer.java
(100%)
copy {corpus-server-impl => corpus-server/corpus-server-impl}/feature.xml (88%)
copy {tagging-server => corpus-server/corpus-server-impl}/pom.xml (60%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/Activator.java
(98%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/CorpusServerImpl.java
(98%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/DerbyCorporaStore.java
(68%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/DerbyCorpusStore.java
(96%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/LuceneIndexer.java
(100%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/LuceneSearchService.java
(98%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/java/org/apache/opennlp/corpus_server/impl/UimaUtil.java
(100%)
rename
corpus-server/{src/main/resources/org/apache/opennlp/corpus_server/search =>
corpus-server-impl/src/main/resources/org/apache/opennlp/corpus_server/impl}/IndexWriter.properties
(100%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/resources/org/apache/opennlp/corpus_server/impl/LuceneIndexer.xml
(100%)
rename {corpus-server-impl =>
corpus-server/corpus-server-impl}/src/main/resources/org/apache/opennlp/corpus_server/impl/TypeSystem.xml
(100%)
rename {corpus-server-tools => corpus-server/corpus-server-tools}/bin/cs-tools
(100%)
rename {corpus-server-tools => corpus-server/corpus-server-tools}/pom.xml (69%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/CASImporter.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/CorpusBackup.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/CreateCorpus.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/CreateTaskQueue.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/DropCorpus.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/FileUtil.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/RemoveCAS.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/ReplaceTypeSystem.java
(100%)
rename {corpus-server-tools =>
corpus-server/corpus-server-tools}/src/main/java/org/apache/opennlp/corpus_server/tools/SearchCorpus.java
(100%)
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/all-tsne2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib1/27Bib1Amos_Prophecy_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib1/28Bib1Amos_Prophecy_89_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib1/29Bib1Ezra_History_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib1/30Bib1Joel_Prophecy_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib1/31Bib1Ruth_History_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/32Bib2John_Gospel_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/33Bib2Jude_Epistle_1_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/34Bib2Luke_Acts_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/35Bib2Luke_Acts_2728_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/36Bib2Luke_Gospel_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Bib2/37Bib2Mark_Gospel_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/38CorpApple_Environment_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/39CorpHandM_Quality_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/40CorpHandM_Responsibility_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/41CorpHP_Objectives_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/42CorpJaguar_Sustainability_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Corp/43CorpZara_Environment_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/44FictAndersenH_Mermaid_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/45FictAndersenH_Ugly_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/46FictBalzacH_Goriot_Ia_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/47FictBalzacH_Goriot_Ib_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/48FictBronteC_JaneEyre_33_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/49FictBronteC_JaneEyre_6_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/50FictCarrollL_Wonderland_2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/51FictCarrollL_Wonderland_5_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/52FictDostoyevskyF_CrimePun_ep_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/53FictDostoyevskyF_CrimePun_II2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/54FictDumasAp_3Musk_11_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/55FictDumasAp_3Musk_2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/56FictFlaubertG_Bovary_I5_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/57FictFlaubertG_Bovary_III3_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/58FictFlaubertG_Salammbo_11_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/59FictFlaubertG_Salammbo_2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/60FictGrimmJ_Bremusicians_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/61FictGrimmJ_HanselGretel_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/62FictHugoV_Hunchback_II5_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/63FictHugoV_Hunchback_IV3_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/64FictPoeE_Purloined_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/65FictPoeE_Usher_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/66FictTolstoyL_AnnaK_I10_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/67FictTolstoyL_AnnaK_I11_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/68FictTolstoyL_WarPeace_I16_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/69FictTolstoyL_WarPeace_I2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/70FictWildeO_Dorian_18_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/71FictWildeO_Dorian_8_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/72FictZolaE_Germinal_II4_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Fict/73FictZolaE_Germinal_VII2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Marx/74MarxMarxK_ComMan_01_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Marx/75MarxMarxK_ComMan_24_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Marx/76MarxMarxK_Feuerbach_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Marx/77MarxMarxK_GothaProg_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Marx/78MarxMarxK_JewishQ_EN.txt.txt
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/494news1\"
url=\"http:__observer.guardian.co.uk_international_story_0,,631931,00.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/495news2\"
url=\"http:__news.bbc.co.uk_2_hi_middle_east_5136988.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/496news3\"
url=\"http:__news.bbc.co.uk_2_hi_asia-pacific_2181151.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/497news4\"
url=\"http:__news.bbc.co.uk_2_hi_business_2235352.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/498news5\"
url=\"http:__money.guardian.co.uk_news__0,,,00.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/499news6\"
url=\"http:__football.guardian.co.uk_Match_Report_0,,1536875,00.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/500news7\"
url=\"http:__news.bbc.co.uk_2_hi_asia-pacific_5133220.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/501news8\"
url=\"http:__news.bbc.co.uk_2_hi_europe_4263426.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/502news9\"
url=\"http:__news.bbc.co.uk_2_hi_business_2769931.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/503newsa\"
url=\"http:__news.bbc.co.uk_2_hi_uk_news_education_2191422.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/504newsb\"
url=\"http:__news.bbc.co.uk_2_hi_africa_2909769.stm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/News/505newsc\"
url=\"http:__news.bbc.co.uk_2_hi_uk_news_2509561.stm.txt"
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/79NewsEnnajiM_Maghreb_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/80NewsGoalcom_MessiTop50_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/81NewsGueyeA_BlackPete_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/82NewsLeM_OrbanGoldmanSachs_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/83NewsMendesFrancoJ_HaitiBeyondCapital_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/84NewsMillerH_FrankensteinTradition_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/85NewsRabinovichI_IranNuclear_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/86NewsRian_IranCutsOil_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/87NewsRian_MedvedevDismisses_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/News/88NewsWiki_KaradzicArrest_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Opac/89OpacStallman_FreeSoft_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Opac/90OpacTeam_Berlin_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Opac/91OpacTeam_Budapest_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/100TediOConnellA_Quantum_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/101TediRoslingH_Poverty_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/102TediSinclairC_OpenArchitech_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/92TediAndersonEt_NuclearEnergy_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/93TediBelcherA_Batteries_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/94TediGellMannM_Lang_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/95TediJakubowskiM_OpenTech_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/96TediJordanC_ShockStats_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/97TediMcKeanE_Dict_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/98TediMillerA_News_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tedi/99TediNatchweyJ_WarPhotos_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/103TeleHTC_Manual_0_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/104TeleHTC_Manual_10_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/105TeleHTC_Manual_11_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/106TeleHTC_Manual_12_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/107TeleHTC_Manual_13_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/108TeleHTC_Manual_1_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/109TeleHTC_Manual_2_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/110TeleHTC_Manual_3_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/111TeleHTC_Manual_4_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/112TeleHTC_Manual_5_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/113TeleHTC_Manual_6_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/114TeleHTC_Manual_7_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/115TeleHTC_Manual_8_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tele/116TeleHTC_Manual_9_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Teli/117TeliApple_iPhone4_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/118TelsGoog_Answer_0545_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/119TelsGoog_Answer_0a46_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/120TelsGoog_Answer_0bcf_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/121TelsGoog_Answer_1851_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/122TelsGoog_Answer_1b37_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/123TelsGoog_Answer_2feb_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/124TelsGoog_Answer_3024_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/125TelsGoog_Answer_4b5b_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/126TelsGoog_Answer_596f_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/127TelsGoog_Answer_5b4c_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/128TelsGoog_Answer_70d7_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/129TelsGoog_Answer_770f_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/130TelsGoog_Answer_91e4_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/131TelsGoog_Answer_94d0_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Tels/132TelsGoog_Answer_a67e_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Unit/133UnitGass_Resolution_62250_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Unit/134UnitUnat_Charter_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Unit/135UnitUnat_HumanRights_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Unit/136UnitUnat_StatuteICOJ_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Wind/137WindParaschivoiuEt_DarrieusTurbine_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Wind/138WindPurohitEt_CDMIndia_EN.txt.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/Wind/139WindRiadhEt_ContrarotatingConverter_EN.txt.txt
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bact/311bacte\"
url=\"http:__vue.org.uk_carlos.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/baiw/312baiwc\"
url=\"http:__www.sleafordtownfc.co.uk_archives_archived_game.asp?MatchID=89&Season=2002_03.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bays/313baysn\"
url=\"http:__www.portscathoholidays.co.uk_ShowDetails.asp?id=96.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bbgk/314bbgkl\"
url=\"http:__www.homezonenews.org.uk_news_news_detail.asp?nid=22.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bbgl/315bbglz\"
url=\"http:__www.benhs.org.uk_anex.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bcke/316bcked\"
url=\"http:__www.fancy-rats.co.uk_information_guides_guides.php?subject=ratsthatbite.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bcnk/317bcnko\"
url=\"http:__www.ombudsman.org.uk_improving_services_selected_cases_PCA_sc9903_c682b.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bdac/318bdacj\"
url=\"http:__www.mml.cam.ac.uk_call_translation_toolkit_6_.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bdat/252bdat\"
url=\"http:__www.snh.org.uk_nnr-scotland_news_detail.asp?newsID=79.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bdrl/319bdrlk\"
url=\"http:__www.mubs.mdx.ac.uk_Conferences_BPCSR05_submission.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bdsv/320bdsvh\"
url=\"http:__www.herts24.co.uk_flatfiles_paulpearcetributes.aspx.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/belc/321belcb\"
url=\"http:__www.blackpresence.co.uk_phpBB2_viewtopic.php?t=97.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/beoe/322beoeg\"
url=\"http:__www.viploan.co.uk_article_Mortgages-1212.shtml.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bfqb/323bfqbt\"
url=\"http:__www.brainbashers.co.uk_droodlesprev.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bgck/324bgckh\"
url=\"http:__www.photonics.org.uk_newsletter_NoticeBoard.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bgnd/325bgndn\"
url=\"http:__www.snh.org.uk_calendar_jul.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bgpw/326bgpwt\"
url=\"http:__www.cv-library.co.uk_localjobs_Northamptonshire_jobs-in-Brackley.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bgvt/327bgvth\"
url=\"https:__secure.bfi.org.uk_features_ultimatefilm_chart_details.php?ranking=65.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bhdt/328bhdtl\"
url=\"http:__eurocomms.co.uk_online_pr_online_pr.ehtml?o=1647.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bhtu/329bhtur\"
url=\"http:__www.inverness-courier.co.uk_news_fullstory.php_aid_809_Tackling_human_organ_donation_dilemma_.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bhvh/330bhvhh\"
url=\"http:__www.sscs.bham.ac.uk_phsi_eating_bmi.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/biec/331bieca\"
url=\"http:__www.ombudsman.org.uk_improving_services_selected_cases_HSC_IC0107_pt1-e2242.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bjcq/332bjcqp\"
url=\"http:__www.bfice.org.uk_index.asp?contentid=21&menuid=21.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bjyh/333bjyhd\"
url=\"http:__www.ebe.org.uk_ccn.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bjzd/334bjzdi\"
url=\"http:__www.northumberland.gov.uk_vg_text_northpen.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bkeb/335bkebq\"
url=\"http:__www.vam.ac.uk_res_cons_research_research_reports_1992_theatre_museum_index.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bknb/336bknbk\"
url=\"http:__easyweb.easynet.co.uk_jim.shead_River-Arun.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bksu/337bksuh\"
url=\"http:__www.lawson-cruttenden.co.uk_conveyancing.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bkvb/338bkvbo\"
url=\"http:__www.hamradio.co.uk_acatalog_Vert_Arno_Ant.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bkxn/339bkxng\"
url=\"http:__travel.independent.co.uk_europe_article1192096.ece.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/blun/340blunb\"
url=\"http:__www.nsbapty.co.uk_Supp-Samp.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bmbk/341bmbka\"
url=\"http:__www.shakespeare-country.co.uk_swt.aspx?&cp=.._swt_&cg=_&sim=&id=487&pagetype=27.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bmwr/342bmwro\"
url=\"http:__www.surf4wine.co.uk_Eben_Sadie.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bnaq/343bnaqt\"
url=\"http:__jobsearch.localgov.monster.co.uk_getjob.asp?JobID=46663258&AVSDM=2006%2D08%2D10+09%3A45%3A00&Logo=0&sort=cp&pg=1.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bnqe/253bnqe\"
url=\"http:__www.ecodyfi.org.uk_commfirstactionplanpr.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bofv/254bofv\"
url=\"http:__www.sefton.gov.uk_page&3630.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bopl/344boplu\"
url=\"http:__www.dw-perspective.org.uk_dwboard_messages_112.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/botu/345botuf\"
url=\"http:__www.landforsale-investment.org.uk_Plot-Sales.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bova/346bovad\"
url=\"http:__www.expertcardirectory.co.uk_car-leasing-jamjar.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bped/347bpedf\"
url=\"http:__www.nta.nhs.uk_news_020624.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bpjo/348bpjoh\"
url=\"http:__www1.city.ac.uk_law_lawpages_Victim_Support.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bpsf/349bpsfu\"
url=\"http:__www.industrialnetworking.co.uk_mag_v7-2_p7.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bqbn/350bqbnl\"
url=\"http:__www.cedr.co.uk_index.php?location=_news_archive_20040628.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bqcc/351bqccv\"
url=\"http:__www.idler.co.uk_archives_?page_id=18.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bqsw/352bqswt\"
url=\"http:__www.donhost.co.uk_support_index.pl?page=mailboxes.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bqxq/353bqxqv\"
url=\"http:__backstage.bbc.co.uk_news_archives_2005_11_backstagebbccou_2.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/brcu/255brcu\"
url=\"http:__www.motheratwork.co.uk_Health_default.asp?article=135.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/brjy/354brjyh\"
url=\"http:__www.learningexperience.org.uk_learning_first.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bsaj/355bsajb\"
url=\"http:__www.chortle.co.uk_edfest2006_terrysaunders.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bspm/356bspmu\"
url=\"http:__www.cps.gov.uk_legal_section21_chapter_f.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bssg/357bssga\"
url=\"http:__www.tropicalfishcentre.co.uk_Plants.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btab/358btabi\"
url=\"http:__www.bba.org.uk_bba_jsp_polopoly.jsp?d=155&a=493.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btbb/359btbbg\"
url=\"http:__www.burpham.surrey.sch.uk_potter.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bthk/360bthkw\"
url=\"http:__www.ttrb.ac.uk_viewArticle.aspx?categoryId=14542&taggingType=4&contentId=11208.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bthx/361bthxs\"
url=\"http:__www.rvrcd.co.uk_catalogue_walker_walkerreviews.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btlm/362btlmk\"
url=\"http:__www.birdtours.co.uk_tripreports_Spain_andalucia6_and-oct-03.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btsm/363btsmp\"
url=\"http:__www.trainingservicesindex.co.uk_newsletter_aug04.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btsx/364btsxl\"
url=\"http:__www.mediaweek.co.uk_search_index.cfm?fuseaction=details&nNewsID=560539.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/btvt/365btvti\"
url=\"http:__www.i-dj.co.uk_artists_artistspage.php?ID=204&page=3.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bukc/366bukcu\"
url=\"http:__www.ukpages.freewire.co.uk_buying-property-continent.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bvai/367bvaif\"
url=\"http:__www.uservision.co.uk_usability_articles_print_wud.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bvha/368bvhab\"
url=\"http:__agrifor.ac.uk_browse_cabi_3736cbd2e5895cf49854f8d70494bae7.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bvqz/369bvqzk\"
url=\"http:__www.elsham.pwp.blueyonder.co.uk_cx500_oil_pump_.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bvxo/370bvxom\"
url=\"http:__www.schools.co.uk_index.php?name=News&file=article&sid=34.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bwal/371bwale\"
url=\"http:__www.poptel.org.uk_scgn_articles_9902_inbrief.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bwvh/372bwvhf\"
url=\"http:__www.tameside.gov.uk_tmbc6_cycling_withoutmycar.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bycu/373bycul\"
url=\"http:__www.mubs.mdx.ac.uk_Staff_Personal_pages_Ifan1_Booth_Notebooks.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/byeg/374byegq\"
url=\"http:__www.thehealthierlife.co.uk_article_3603_reduce-cancer-reoccurrence.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bykk/375bykkm\"
url=\"http:__jobs.leaddiscovery.co.uk_job.aspx?jid=11535&cd=1.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bynx/376bynxp\"
url=\"http:__www.syscom.plc.uk_solutions_distrib.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bytv/377bytvq\"
url=\"http:__personalfinance.iii.co.uk_articles_articledisplay.jsp?section=Banking&article_id=64923.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzam/378bzamy\"
url=\"http:__www.evolutec.co.uk_06_chairman.asp?thesub=6.0.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzfk/379bzfki\"
url=\"http:__www.truststfc.co.uk_meeting_27_09_2006.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzic/380bzicn\"
url=\"http:__www.macintyrecharity.org.uk_transition_personal_experiences_michael.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bziz/381bzizf\"
url=\"http:__union.ic.ac.uk_scc_icsf_library_library_history_library_history_3.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzlq/382bzlqz\"
url=\"http:__www.socialistunitynetwork.co.uk_news_g8jepps.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzor/383bzors\"
url=\"http:__www.weirdwiltshire.co.uk_250703.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzsx/384bzsxn\"
url=\"http:__www.tsha.nhs.uk_modernising-healthcare-in-trent_the-local-supervising-authority-midwifery_lsa-guidelines_maternal-deaths.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/bzxm/385bzxmk\"
url=\"http:__www.buildingproductexpert.co.uk_ExpandedEntries_expandedentry.asp?cid=212046&cname=Mark+Simpkin+Ltd&frmBPE=&frmCD=N&mopt=dpe&dpid=2302.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cahe/386cahel\"
url=\"http:__www.siba.co.uk_about.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cbfp/387cbfpd\"
url=\"https:__secure.advanceperformance.co.uk_acatalog_Men_s_Wave_Nirvana_2_Mizuno_Running_Shoes.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cbuk/388cbukt\"
url=\"http:__www.deafnessresearch.org.uk_?lid=1944&tmpl=ddmainprint.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cbxv/389cbxvh\"
url=\"http:__www.port.ac.uk_departments_services_campusenvironment_.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cckm/390cckmj\"
url=\"http:__www.dillington.co.uk_day_course_details.asp?ED=Arts+and+Crafts&offset=66.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ccnl/256ccnl\"
url=\"http:__www.esporta.co.uk_Clubs_Mids+%26+East+Anglia_Oxford_Promotions_Member%27s+Forum_!+!_CLASS_Advert_DBID_17ea4c66d7bd2c0aeb4513c89cb01afd.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cdfc/391cdfcq\"
url=\"http:__www.fst.rdg.ac.uk_news-archive-2004-11.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cdng/392cdngg\"
url=\"http:__www.aslib.co.uk_training_careers_9.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cdqv/393cdqvl\"
url=\"http:__www.ncl.ac.uk_undergraduate_course_A106_profile_Can-I-spend-time-on-an-elective.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cedi/394cedie\"
url=\"http:__www.incomesdata.co.uk_europe_duediligence.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cegc/395cegcr\"
url=\"http:__www.pennine.demon.co.uk_NPC_1982_MEXICOSP.HTM.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/celp/396celpi\"
url=\"http:__www.hsl.gov.uk_publications_car.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cest/397cesta\"
url=\"http:__www.baronage.co.uk_bphtm-01_const-02.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cewp/398cewpo\"
url=\"http:__www.assureweb.co.uk_public_Main.asp?Params=65C5B21F70C4D12078C6116FD0FD01ED50A0B7BBFBEBBDC7F85DB3C8C41964AFCF3977972B54AAC68E8AE50A7AB1888C6DEE8379864B7E79F21CA9025DF7DD55D14C83960FBA06562FFBA3B67013B5558FE96AD7.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfec/399cfecj\"
url=\"http:__www.myleedsjobs.co.uk_jobdetails-11834.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfuh/400cfuhe\"
url=\"http:__www.paperairplanes.co.uk_orplan.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfvq/401cfvqe\"
url=\"http:__www.eca.ac.uk_tacitus_news.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfwj/402cfwje\"
url=\"http:__www.casino-avenue.co.uk_2004_06_duuuuh.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfwt/403cfwtc\"
url=\"http:__www.dwp.gov.uk_lifeevent_penret_penreform_5_reg.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cfxp/404cfxpi\"
url=\"http:__www.framearch.co.uk_projects_T5_excavation.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cgbz/405cgbzt\"
url=\"http:__www.redcross.org.uk_section.asp?id=49633.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cgel/406cgelv\"
url=\"http:__www.forestforum.org.uk_jobs_forestsmonitor2001.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cgjx/407cgjxf\"
url=\"http:__www.twickenham-museum.org.uk_kids_detail.asp?ContentID=189.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cgzy/257cgzy\"
url=\"http:__www.offthetelly.co.uk_interviews_markwright.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/chns/408chnsk\"
url=\"http:__www.sitcom.co.uk_tlc_characters.shtml.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/chny/409chnyq\"
url=\"http:__www.aberdeen-grampian.co.uk_whiskycountry_ess_walk.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cicu/410cicug\"
url=\"http:__www.shipleygreenparty.org.uk_sgpnewsarticle20051222a.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cipr/411ciprs\"
url=\"http:__www.employment-solicitors.co.uk_Employer1.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/citx/412citxq\"
url=\"http:__www.princessquare.co.uk_news_Food_Sounds_So_Good_at_DArcys_.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjia/413cjiau\"
url=\"http:__www.sweetsforu.co.uk_shipping.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjjc/414cjjcl\"
url=\"http:__www.e.volve.org.uk_Listings.aspx?index=387&item=2929.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjqc/415cjqcv\"
url=\"http:__www.verko.co.uk_product.aspx?catno=53&prod=HCAA6241.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjta/416cjtan\"
url=\"http:__www.romancesouthwest.co.uk_main_en_att-provider-ROMA_6913.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjto/417cjton\"
url=\"http:__www.art-works.org.uk_artworks_z030703b.shtml.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjtu/418cjtub\"
url=\"http:__www.jr2.ox.ac.uk_bandolier_booth_miscellaneous_wristgang.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cjwg/419cjwgx\"
url=\"http:__www.changingdiabetes.co.uk_view.asp?ID=92.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ckcu/420ckcux\"
url=\"http:__www.lashelmets.co.uk_las%20new%20bionix%20page.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ckiv/421ckivb\"
url=\"http:__www.cb-com.co.uk_listgen.asp?layout=results-brief.asp&page=37&sql=&sortup=sorttitle&bookstatus=OK.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ckju/422ckjul\"
url=\"http:__www.wildlifetrust.org.uk_cheshire_proj_harvest_survey.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ckrq/423ckrqy\"
url=\"http:__www.enemydown.co.uk_clancomments.php?id=35113.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ckym/424ckymf\"
url=\"http:__www.scis.org.uk_search_menu_new.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/clez/425clezz\"
url=\"http:__www.uk-wholesaler.co.uk_softbook_clickbankmembership_clickbankprotector.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/clsl/426clslk\"
url=\"http:__www.blewa.co.uk_project5_teachers_T5-0-1.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cmna/427cmnal\"
url=\"http:__www.politicalwizard.co.uk_administration_childsocnew_index.php?category=campaigns&c=i&uid=2130.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cnos/428cnosx\"
url=\"http:__www.kent-ccc.co.uk_news_story.php?id=660.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cnoz/429cnozg\"
url=\"http:__beehive.thisisexeter.co.uk_default.asp?WCI=SiteHome&ID=9908&PageID=56638.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cnqw/430cnqwk\"
url=\"http:__bookshop.blackwell.co.uk_jsp_id_0340894342_Divine_Madness.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cntu/431cntup\"
url=\"http:__www.newble.co.uk_chalmers_innes.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cody/432codym\"
url=\"http:__www.searchenginespy.co.uk_article0027.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/coip/433coipg\"
url=\"http:__www.scottishcorpus.ac.uk_corpus_search_document.php?documentid=1211.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cplj/434cpljw\"
url=\"http:__www.peterhead.org.uk_familyheritage_forum_topic.asp?TOPIC_ID=26&.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cpnw/435cpnwa\"
url=\"http:__www.frenchhouserestoration.co.uk_franceproperty150to200_propertyandhousesforsalelimousinabn0509263.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cqha/436cqham\"
url=\"http:__www.rcpsych.ac.uk_college_faculties_liaison_documents_servicedevelopment_managerialfacilities.aspx.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cqng/437cqngo\"
url=\"http:__www.tlchm.bris.ac.uk_safety_various_rass_kmweb_safety_msds.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cqrd/438cqrdh\"
url=\"http:__www.msabritain.co.uk_index.php?id=23&L=3&article=13.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/crkw/439crkwd\"
url=\"http:__www.frontier.net.uk_FAQsearch.asp?search_strFields=strMetaKeywords&search_strType=FAQS&search_strAreaNo=1053,2011&strKeyword=PS2006_4_3.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/crsr/440crsrx\"
url=\"http:__www.itreviews.co.uk_games_g232.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/csah/441csahf\"
url=\"http:__www.petergasston.co.uk_2002_09_to-quote-the-four-seasons.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/csct/442csctp\"
url=\"http:__www.kevinmayhew.co.uk_Mobile_default.aspx?group_id=16538&article_id=21979.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/csmw/443csmwd\"
url=\"http:__www.ceac.aston.ac.uk_research_staff_jpf_papers_paper26_index.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/csqc/444csqcw\"
url=\"http:__www.all-energy.co.uk_newsletter45.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/csxj/445csxju\"
url=\"http:__socialistworker.org.uk_article.php?article_id=8138.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ctcu/446ctcuk\"
url=\"http:__www.setdanceteacher.co.uk_newmarketmez.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ctfd/447ctfdn\"
url=\"http:__www.ebi.ac.uk_interpro_DisplayIproEntry?ac=IPR002824.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ctgo/448ctgol\"
url=\"http:__www.garthyfog.co.uk_mawddach_valley.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cuua/258cuua\"
url=\"http:__www.swcc.org.uk_caving_expeditions_jura05_jura_circ1.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cvbw/449cvbwe\"
url=\"http:__www.oca-online.co.uk_viewnews.cfm?news_id=177.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cvgk/450cvgkz\"
url=\"http:__www.chichester.co.uk_mk4CustomPages_CustomPage.aspx?PageID=24163&sectionID=4585.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cvqe/451cvqer\"
url=\"http:__www.webstar.co.uk_~musnews_news_search.php?search=&start=12080.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwbp/452cwbpn\"
url=\"http:__www.linc4info.org.uk_cms_pages_sitemap.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwcq/453cwcqx\"
url=\"http:__www.ccp4.ac.uk_courses_IUCr2005_index.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwde/454cwdel\"
url=\"http:__www.perceptive-engineering.co.uk_html_training.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwhb/455cwhbc\"
url=\"http:__www.lanpac.co.uk_csi.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwma/456cwmaf\"
url=\"http:__www.chisenhale.org.uk_html_files_501_project_info.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cwzw/457cwzwc\"
url=\"http:__www.ilnpictures.co.uk_showpage.asp?showdocumentid=196.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cxnk/458cxnko\"
url=\"http:__www.starlink.rl.ac.uk_star_docs_sun232.htx_node17.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cxxy/459cxxyp\"
url=\"http:__www.publications.parliament.uk_pa_cm199900_cmhansrd_vo000405_debtext_00405-07.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/cyyc/460cyyci\"
url=\"http:__www.dwalker.pwp.blueyonder.co.uk_Fasti%20V.2_p.%20278%20PRESBYTERY%20OF%20PENPONT%20p.%20672.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/czqo/461czqoj\"
url=\"http:__www.wessingtoncryogenics.co.uk_serv01.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/czve/462czvea\"
url=\"http:__www.aylesburyvale.gov.uk_avdc_content_index.jsp?contentid=1999276669.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dagx/463dagxc\"
url=\"http:__www.stratford-upon-avon.co.uk_static_481.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/danu/464danug\"
url=\"http:__www.synergygroup.co.uk_office-support-recruitment_.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/daqq/465daqqs\"
url=\"http:__www.sexshop365.co.uk_catalog_product_info.php?products_id=2981.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/daws/466dawss\"
url=\"http:__www.honda-racing.co.uk_fourwheels_formula1_article.asp?a=1327.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dbbq/467dbbqw\"
url=\"http:__www.bioinformatics.leeds.ac.uk_~david_docs_api_javax_swing_JSplitPane.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dbhi/468dbhia\"
url=\"http:__www.ateonline.co.uk_60_66_67_articles_7335.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dbjz/469dbjza\"
url=\"http:__www.iae.co.uk_news_designedforthejob.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dbzi/470dbzic\"
url=\"http:__www.oaa.org.uk_Case_Studies_studies_Ford3_Ford3.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dccp/471dccpz\"
url=\"http:__www.jamesgourmetcoffee.co.uk_product.php?xProd=21&xSec=22.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dcon/472dcont\"
url=\"http:__www.uservision.co.uk_usability_aboutus_usability_aboutus.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dcqe/473dcqen\"
url=\"http:__www.learnenglish.org.uk_crazyworld_series2_crazyworld_story.asp?latestchapter=12&subarea=11.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dcsp/474dcspt\"
url=\"http:__www.guysherratt.co.uk_pages_searchdetails.asp?ID=776.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dddx/475dddxm\"
url=\"http:__www.menshealthforum.org.uk_userpage1.cfm?item_id=1913.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ddqu/476ddquk\"
url=\"http:__www.schoolhouse.org.uk_law_not_enrolled.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/deck/477decku\"
url=\"http:__www.womenintothenetwork.co.uk_page_calendar_archive_article.cfm?articleId=52.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/decp/478decpr\"
url=\"http:__www.lathes.co.uk_beaver_page5.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dehf/479dehfj\"
url=\"http:__www.hasslefreeminiatures.co.uk_rules.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/deqg/480deqgv\"
url=\"http:__www.newworknetwork.org.uk_modules_event_viewevent.php?eveid=109.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/derj/481derjo\"
url=\"http:__www.cheatgenius.co.uk_cheats_641_Gamecube-cheats_Gamecube-(hardware)-Cheats.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dfnm/482dfnmt\"
url=\"http:__www.omega.co.uk_ppt_pptsc.asp?ref=LE902.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dfoo/483dfoor\"
url=\"http:__www.fulcrum-anglican.org.uk_forum_poster.cfm?sort=creatasc&poster=101.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dfvl/484dfvlp\"
url=\"http:__www.la-hq.org.uk_directory_prof_issues_blreview.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dfzy/485dfzyc\"
url=\"http:__www.billyarmstrong.co.uk_050613_public_urged_to_back_london's_olympic_2012_bid.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dgmo/486dgmor\"
url=\"http:__chat.dailymail.co.uk_dailymail_threadnonInd.jsp?forum=106&thread=9757638&message=11724737.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dgti/487dgtix\"
url=\"http:__www.thebookpeople.co.uk_webapp_wcs_stores_servlet_product_10001_10051_20553_100_10012_10010_category_10010.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dgws/488dgwsx\"
url=\"http:__www.bjhc.co.uk_news_industry_2005_ind505016.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dgzt/489dgztd\"
url=\"http:__www.uea.ac.uk_eas_events_litfestspr04.shtml.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dheb/490dhebu\"
url=\"http:__www.kimberry.co.uk_Dotnetlectures_Index.aspx.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dheg/491dhegq\"
url=\"http:__www.lathes.co.uk_wolfjahnmiller_page2.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dhem/492dhemc\"
url=\"http:__www.humanism.org.uk_site_cms_newsarticleview.asp?article=2173.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/dhow/493dhowh\"
url=\"http:__www.anweb.co.uk_l_04_c3_c3a10.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/eizz/259eizz\"
url=\"http:__www.royalhigh.edin.sch.uk_content_subject_modernlanguages_course_s1s2.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/fodw/260fodw\"
url=\"http:__www.law.warwick.ac.uk_ltj_4-1m.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/fvms/261fvms\"
url=\"http:__www.citizenshipfoundation.org.uk_main_news.php?n20.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/guzs/262guzs\"
url=\"http:__www.arnside-online.co.uk_care.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/hhvw/263hhvw\"
url=\"http:__www.oarsport.co.uk_products_leatherman_micra.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/hkay/264hkay\"
url=\"http:__www.bnp.org.uk_columnists_docdiary2.php?docId=103.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/hzbi/265hzbi\"
url=\"http:__www.familiesonline.co.uk_article_articleview_1733_1_153.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/kbmr/266kbmr\"
url=\"http:__www.ladybird-survey.pwp.blueyonder.co.uk_P_mugo.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/kjkq/267kjkq\"
url=\"http:__www.free-internet.co.uk_email_sendmail.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/kzix/268kzix\"
url=\"http:__www.cs.bham.ac.uk_resources_ums_PythonDoc_api_threads.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/lfwv/269lfwv\"
url=\"http:__www.thisismoney.co.uk_news_columnists_article.html?in_article_id=405873&in_page_id=50002.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ljrm/270ljrm\"
url=\"http:__www.learningservices.gcal.ac.uk_synergy_03_scwbl.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/lptf/271lptf\"
url=\"http:__www.nisp.co.uk_pooled_articles_BF_NEWSART_view.asp?Q=BF_NEWSART_95582.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/lqyu/272lqyu\"
url=\"http:__www.mountainsoftware.co.uk_printpage.asp?REF=_group.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/mail/273mail\"
url=\"http:__www.dba.org.uk_aboutdba_chriswood.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/mpxl/274mpxl\"
url=\"http:__www.surefish.co.uk_culture_books_0804_110804_food_books.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/mtps/275mtps\"
url=\"http:__www.newtsnni.gov.uk_actionplan_04b.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/mtqb/276mtqb\"
url=\"http:__www.hummersknott.org.uk_Stud_Res_Info_Tec_Info_ICT_KS3_databases_relational_databases.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ndi\"/247ndi\"
url=\"http:__www.stockportmbc.gov.uk_secondary_offerton_pages_SchemesofWork_KS4_skillswl.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/odv\"/248odv\"
url=\"http:__www.find-me-a-gift.co.uk_gifts-for-men_unusual-gadgets_mood-light-tile.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/omzz/277omzz\"
url=\"http:__www.swindon-speedway.co.uk_modules.php?op=modload&name=News&file=article&sid=175&mode=thread&order=0&thold=0.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/oojb/278oojb\"
url=\"http:__www.engender.org.uk_justice.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/opab/279opab\"
url=\"http:__www.heros.org.uk_home_sub.asp?page=2.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/orle/280orle\"
url=\"http:__www.bsg.org.uk_clinical_prac_mar_05_mar05_08.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/osor/281osor\"
url=\"http:__www.cdp.bham.ac.uk_About_CDP_methods.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/pabf/282pabf\"
url=\"https:__www.cambs-police.co.uk_caminfo_blueprint_articles.asp?ID=807.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/pkbn/283pkbn\"
url=\"http:__www.hmso.gov.uk_legislation_scotland_acts2002_20017--b.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/pxnz/284pxnz\"
url=\"http:__www.dog-pictures.co.uk_dog-pictures_shiba_inu.shtml.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/qsym/285qsym\"
url=\"http:__www.strawbale-building.co.uk_index.php?page=faq.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/qvpo/286qvpo\"
url=\"http:__company.monster.co.uk_londonunderuk_tfl_our_careers.asp.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rfk\"/249rfk\"
url=\"http:__www.environment.bham.ac.uk_extindex.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rfkm/287rfkm\"
url=\"http:__www.artshole.co.uk_exhibitions_Aug%2006%2004_James%20Cauty.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rivm/288rivm\"
url=\"http:__www.sincuser.f9.co.uk_050_lastwrd.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rkwj/289rkwj\"
url=\"http:__www.ocdaction.org.uk_skin-picking.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rlwz/290rlwz\"
url=\"http:__www.greenparty.org.uk_news_2033.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/rnce/291rnce\"
url=\"http:__www.lel.ed.ac.uk_linguist_issues_17_17-229.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/sbdw/292sbdw\"
url=\"http:__sccplugins.sheffield.gov.uk_press_news_aRelease.asp?akey=2026&Mon=01_07_2004.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/sbqp/293sbqp\"
url=\"http:__www.lpt.nhs.uk_service5.php.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/seaz/294seaz\"
url=\"http:__www.panos.org.uk_resources_reportdetails.asp?id=1039.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/smar/295smar\"
url=\"http:__www.arctech.co.uk_siemens_hosted_exchange.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/sqdo/296sqdo\"
url=\"http:__gimbo.org.uk_archives_2006_01_chomsky_intervi.html.txt"
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/0syndicate_bmw-s-and-chinese-justice.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/10syndicate_france-s-fourth-moment.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/11syndicate_fran-ois-hollande-s-wrong-idea-of-france-by-brigitte-granville.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/12syndicate_hollywood-s-favorite-villains.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/13syndicate_japanese-lessons-for-china-s-currency.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/14syndicate_kennedy--khrushchev--the-cuban-missile-crisis-and-nuclear-deterrence-from-cuba-to-iran-by-joseph-s--nye.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/15syndicate_merkel-in-china-by-sanjaya-baru.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/16syndicate_ms--europe-or-frau-germania-.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/17syndicate_reshaping-china-s-government-services-supply-chain-by-andrew-sheng-and-geng-xiao.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/18syndicate_russia-s-ukrainian-path-to-the-future.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/19syndicate_should-europe-regulate-sovereign-wealth-funds-.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/1syndicate_china-and-a-new-balance-of-power.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/20syndicate_the--browning--of-african-technology.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/21syndicate_the-china-question.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/22syndicate_the-end-of-the-russia-china-debate.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/23syndicate_the-making-of-china-s-trade-deficit.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/24syndicate_the-return-of-franco-german-leadership.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/25syndicate_the-transatlantic-index.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/26syndicate_will-russia-save-the-west-.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/2syndicate_china-and-russia-in-the-new-world-disorder.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/3syndicate_china-japan-protests-islands-by-liah-greenfeld.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/4syndicate_china-s-cyber-warriors.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/5syndicate_china-s-gift-to-europe.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/6syndicate_china-s-threat-to-russia.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/7syndicate_europe-s-vital-french-connection-by-kemal-dervi.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/8syndicate_exchange-rate-disorder.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/synd/9syndicate_france-and-germany-must-act-in-iraq.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/140ted_a_j_jacobs_year_of_living_biblically.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/141ted_alan_kay_shares_a_powerful_idea_about_ideas.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/142ted_alex_tabarrok_foresees_economic_growth.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/143ted_amy_tan_on_creativity.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/144ted_barry_schwartz_on_the_paradox_of_choice.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/145ted_benjamin_wallace_on_the_price_of_happiness.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/146ted_bono_s_call_to_action_for_africa.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/147ted_dan_dennett_cute_sexy_sweet_funny.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/148ted_daniel_kraft_invents_a_better_way_to_harvest_bone_marrow.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/149ted_dave_eggers_makes_his_ted_prize_wish_once_upon_a_school.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/150ted_don_norman_on_design_and_emotion.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/151ted_doris_kearns_goodwin_on_learning_from_past_presidents.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/152ted_elliot_krane_the_mystery_of_chronic_pain.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/153ted_eva_zeisel_on_the_playful_search_for_beauty.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/154ted_ex_moonie_diane_benscoter_how_cults_think.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/155ted_hans_rosling_at_state.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/156ted_helen_fisher_tells_us_why_we_love_cheat.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/157ted_isabel_allende_tells_tales_of_passion.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/158ted_jessi_arrington_wearing_nothing_new.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/159ted_john_underkoffler_drive_3d_data_with_a_gesture.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/160ted_joseph_lekuton_tells_a_parable_for_kenya.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/161ted_julia_sweeney_has_the_talk.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/162ted_ken_robinson_says_schools_kill_creativity.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/163ted_marcin_jakubowski.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/164ted_mary_roach_10_things_you_didn_t_know_about_orgasm.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/165ted_michael_sandel_the_lost_art_of_democratic_debate.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/166ted_michael_shermer_on_believing_strange_things.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/167ted_misha_glenny_investigates_global_crime_networks.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/168ted_oliver_sacks_what_hallucination_reveals_about_our_minds.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/169ted_rebecca_saxe_how_brains_make_moral_judgments.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/170ted_robert_thurman_on_compassion.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/171ted_rory_sutherland_life_lessons_from_an_ad_man.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/172ted_sean_gourley_on_the_mathematics_of_war.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/173ted_siegfried_woldhek_shows_how_he_found_the_true_face_of_leonardo.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/174ted_stephen_wolfram_computing_a_theory_of_everything.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/175ted_tom_wujec_build_a_tower.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/176ted_tom_wujec_on_3_ways_the_brain_creates_meaning.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/ted/177ted_william_li.txt
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/tkhv/297tkhv\"
url=\"http:__www.company-wizard.co.uk_SEO_Link-Exchange.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/tlg\"/250tlg\"
url=\"http:__www.ourpartnership.org.uk_newspub_story.cfm?id=353&sid=123.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/togq/298togq\"
url=\"http:__www.hearingconcern.org.uk_news_news_scots06.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/tqru/299tqru\"
url=\"http:__histru.bournemouth.ac.uk_Oral_History_Technology_in_the_Community_Joan_Wolstenholme.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/uclj/300uclj\"
url=\"http:__beehive.thisislincolnshire.co.uk_default.asp?WCI=SiteHome&ID=4337&PageID=21591.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/uijm/301uijm\"
url=\"http:__www.galha.freeserve.co.uk_glh_233_mckenna.html.txt"
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/A/178un_A_AC252_L13.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/A/179un_A_C3_61_L17.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/A/180un_APLC_MSP2_2000_1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/181un_CCW_APII_CONF4_SR2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/182un_CD_1605.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/183un_CD_1606.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/184un_CD_1672.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/185un_CD_PV1080.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/186un_CD_PV1157.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/187un_CD_PV857.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/188un_CD_PV861.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/189un_CEDAW_C_2002_II_3_ADD2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/190un_CES_SEM52_2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/191un_CES_SEM52_3.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/192un_CLCS_34.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/C/193un_CRC_GC_2003_4.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/D/194un_DP_2002_34.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/E/195un_E_C16_2002_2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/E/196un_E_CN17_2002_PC2_19.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/E/197un_E_CN3_2003_25.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/E/198un_E_CN4_2003_G_12.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/E/199un_E_CN4_2004_G_21.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/F/200un_FCCC_SBI_2002_15.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/F/201un_FCCC_SBI_2002_9.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/F/202un_FCCC_SBI_2004_L27.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/H/203un_HRI_CORE_1_ADD117.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/H/204un_HRI_CORE_1_ADD123.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/H/205un_HSP_GC_19_2_ADD2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/I/206un_IDB25_6.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/I/207un_IDB35_13.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/I/208un_ISBA_8_A_1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/N/209un_NPT_CONF2005_PCI_10.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/P/210un_PBC24_1_ADD1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/P/211un_PBC24_4-IDB35_4.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/P/212un_PBC_2_SLE_9.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/P/213un_PCNICC_2000_1_ADD1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/P/214un_PCNICC_2001_WGAPIC_L1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/215un_S_2000_475.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/216un_S_2000_817.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/217un_S_2001_1038-A_56_521.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/218un_S_2001_1039.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/219un_S_2001_1317.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/220un_S_2001_70-A_55_740.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/221un_S_2001_947.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/222un_S_2002_1141.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/223un_S_2002_1180.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/224un_S_2002_238-A_56_858.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/225un_S_2002_313-A_56_888.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/226un_S_2002_573-A_56_960.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/227un_S_2003_326-A_ES-10_222.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/228un_S_2006_490.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/229un_S_2009_208-A_63_820.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/230un_SAICM_ICCM2_INF_18.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/231un_S_PV4596.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/232un_S_PV4646.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/233un_S_PV4684RESUMPTION1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/234un_S_PV4736.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/235un_S_PV4903.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/236un_S_PV4944.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/237un_S_PV5627.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/S/238un_ST_SGB_2002_9.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/T/239un_TD_B_49_11.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/T/240un_TD_B_49_SC2_L1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/T/241un_TD_B_COM3_54.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/T/242un_TD_B_EX28_L1.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/T/243un_TESTGVADUTY001.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/U/244un_UNEP_GC_22_8_ADD2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/U/245un_UNEP_GC_24_2.txt
delete mode 100644
opennlp-similarity/src/test/resources/style_recognizer/txt/un/U/246un_UNEP_POPS_INC6_22.txt
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/vgzh/302vgzh\"
url=\"http:__www.societies.stir.ac.uk_sppa_sppa_responsibilities.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/vihv/303vihv\"
url=\"http:__three.co.uk_customer_terms_index.omp?cid=1146151223400.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/wcnf/304wcnf\"
url=\"http:__culturemachine.tees.ac.uk_Cmach_Backissues_j005_Articles_hall.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/wkut/305wkut\"
url=\"http:__www.craigmurray.co.uk_archives_2006_06_met_chief_could.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/wrrh/306wrrh\"
url=\"http:__www.fenews.co.uk_newsview.asp?n=1014.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/wxqy/307wxqy\"
url=\"http:__www2.newsquest.co.uk_the_north_east_petscorner_news_140106.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/xmyp/308xmyp\"
url=\"http:__www.nursingbra.co.uk_emma_jane.htm.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/xqf\"/251xqf\"
url=\"http:__www.macintyrecharity.org.uk_our_services_inclusive_care_worcestershire_easemore_road.html.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/xvwn/309xvwn\"
url=\"http:__www.paramountcomedy2.co.uk_comedy_comedians_comedian.aspx?id=429.txt"
delete mode 100644
"opennlp-similarity/src/test/resources/style_recognizer/txt/ygug/310ygug\"
url=\"http:__www.seequality.org.uk_gender.html.txt"
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/action-plan-doc-list.csv
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/svm.run.mac.zip
delete mode 100755
opennlp-similarity/src/test/resources/tree_kernel/svm_classify
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/svm_classify.exe
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/svm_classify.linux
delete mode 100755 opennlp-similarity/src/test/resources/tree_kernel/svm_learn
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/svm_learn.exe
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/training_pos_neg_sentiment.txt
delete mode 100644
opennlp-similarity/src/test/resources/tree_kernel/tree_kernel.zip
create mode 100644 pom.xml
rename corpus-server-impl/feature.xml => rat-excludes (65%)
delete mode 100644 summarizer/src/test/resources/wordnet/LICENSE
delete mode 100644 summarizer/src/test/resources/wordnet/README
delete mode 100644 summarizer/src/test/resources/wordnet/dict/adj.exc
delete mode 100644 summarizer/src/test/resources/wordnet/dict/adv.exc
delete mode 100644 summarizer/src/test/resources/wordnet/dict/data.adj
delete mode 100644 summarizer/src/test/resources/wordnet/dict/data.adv
delete mode 100644 summarizer/src/test/resources/wordnet/dict/data.noun
delete mode 100644 summarizer/src/test/resources/wordnet/dict/data.verb
delete mode 100644 summarizer/src/test/resources/wordnet/dict/frames.vrb
delete mode 100644 summarizer/src/test/resources/wordnet/dict/index.adj
delete mode 100644 summarizer/src/test/resources/wordnet/dict/index.adv
delete mode 100644 summarizer/src/test/resources/wordnet/dict/index.noun
delete mode 100644 summarizer/src/test/resources/wordnet/dict/index.sense
delete mode 100644 summarizer/src/test/resources/wordnet/dict/index.verb
delete mode 100644 summarizer/src/test/resources/wordnet/dict/lexnames
delete mode 100644 summarizer/src/test/resources/wordnet/dict/noun.exc
delete mode 100644 summarizer/src/test/resources/wordnet/dict/sentidx.vrb
delete mode 100644 summarizer/src/test/resources/wordnet/dict/sents.vrb
delete mode 100644 summarizer/src/test/resources/wordnet/dict/verb.Framestext
delete mode 100644 summarizer/src/test/resources/wordnet/dict/verb.exc