Added: stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/named_entity.properties URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/named_entity.properties?rev=1643760&view=auto ============================================================================== --- stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/named_entity.properties (added) +++ stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/named_entity.properties Mon Dec 8 08:03:19 2014 @@ -0,0 +1,7 @@ +# Properties of an Entity that will be matched against when doing the coreference +spatial.ont.person.attributes=http://dbpedia.org/ontology/birthPlace,http://dbpedia.org/ontology/region,http://dbpedia.org/ontology/nationality,http://dbpedia.org/ontology/country +spatial.ont.organisation.attributes=http://dbpedia.org/ontology/foundationPlace,http://dbpedia.org/ontology/locationCity,http://dbpedia.org/ontology/location,http://dbpedia.org/ontology/hometown +spatial.ont.place.attributes=http://dbpedia.org/ontology/country,http://dbpedia.org/ontology/subdivisionName,http://dbpedia.org/ontology/location + +# Entity classes that will be excluded when doing the coreference because they are too generic. +entity.classes.to.exclude=http://dbpedia.org/ontology/Person,http://dbpedia.org/class/yago/LivingThing100004258,http://dbpedia.org/class/yago/PhysicalEntity100001930,http://dbpedia.org/class/yago/Abstraction100002137,http://dbpedia.org/class/yago/Organism100004475,http://dbpedia.org/class/yago/Location100027167,http://schema.org/Place,http://dbpedia.org/class/yago/Object100002684,http://dbpedia.org/class/yago/YagoGeoEntity,http://www.w3.org/2002/07/owl#Thing,http://dbpedia.org/class/yago/YagoPermanentlyLocatedEntity \ No newline at end of file
Added: stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/pos/en.properties URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/pos/en.properties?rev=1643760&view=auto ============================================================================== --- stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/pos/en.properties (added) +++ stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/config/pos/en.properties Mon Dec 8 08:03:19 2014 @@ -0,0 +1,2 @@ +# Determiners of a noun phrase which determine that the noun phrase is a good candidate for coref. +within.text.referencing.determiners=the,this,these \ No newline at end of file Added: stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/config.properties URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/config.properties?rev=1643760&view=auto ============================================================================== --- stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/config.properties (added) +++ stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/config.properties Mon Dec 8 08:03:19 2014 @@ -0,0 +1,2 @@ +# The Base URL for place adjectival entities +entity.uri.base=http://dbpedia.org/resource/ \ No newline at end of file Added: stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/en URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/en?rev=1643760&view=auto ============================================================================== --- stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/en (added) +++ 
stanbol/branches/STANBOL-1279/entitycoreference/src/main/resources/data/place_adjectivals/en Mon Dec 8 08:03:19 2014 @@ -0,0 +1,236 @@ +Abkhazia Abkhaz, Abkhazian +Afghanistan Afghan +Albania Albanian +Algeria Algerian +American_Samoa American Samoan +Andorra Andorran +Angola Angolan +Anguilla Anguillan +Antigua_and_Barbuda Antiguan, Barbudan +Argentina Argentine, Argentinean, Argentinian +Armenia Armenian +Aruba Aruban +Australia Australian +Austria Austrian +Azerbaijan Azerbaijani, Azeri +Bahamas Bahamian +Bahrain Bahraini +Bangladesh Bangladeshi +Barbados Barbadian +Belarus Belarusian +Belgium Belgian +Belize Belizean +Benin Beninese, Beninois +Bermuda Bermudian, Bermudan +Bhutan Bhutanese +Bolivia Bolivian +Bosnia_and_Herzegovina Bosnian, Bosniak, Herzegovinian +Botswana Motswana, Botswanan +Brazil Brazilian +British_Virgin_Islands British Virgin Island +Brunei Bruneian +Bulgaria Bulgarian +Burkina_Faso Burkinabè +Burma Burmese +Burundi Burundian +Cambodia Cambodian +Cameroon Cameroonian +Canada Canadian +Cape_Verde Cape Verdean +Cayman_Islands Caymanian +Central_African_Republic Central African +Chad Chadian +Chile Chilean +China Chinese +Christmas_Island Christmas Island +Cocos_Islands Cocos Island +Colombia Colombian +Comoros Comorian +Congo Congolese, Congo +Cook_Islands Cook Island, Cook Islands +Costa_Rica Costa Rican +Côte_d'Ivoire Ivorian +Croatia Croatian +Cuba Cuban +Cyprus Cypriot +Czech_Republic Czech +Denmark Danish +Djibouti Djiboutian +Dominica Dominican +Dominican_Republic Dominican +East_Timor Timorese +Ecuador Ecuadorian +Egypt Egyptian +El_Salvador Salvadoran +England English +Equatorial_Guinea Equatorial Guinean, Equatoguinean +Eritrea Eritrean +Estonia Estonian +Ethiopia Ethiopian +Falkland_Islands Falkland Island +Faroe_Islands Faroese +Fiji Fijian +Finland Finnish +France French +French_Guiana French Guianese +French_Polynesia French Polynesian +Gabon Gabonese +Gambia Gambian +Georgia Georgian +Germany German +Ghana Ghanaian 
+Gibraltar Gibraltar +Great_Britain British +Greece Greek, Grecian, Hellenic +Greenland Greenlandic +Grenada Grenadian +Guadeloupe Guadeloupe +Guam Guamanian, Guambat +Guatemala Guatemalan +Guinea Guinean +Guyana Guyanese +Haiti Haitian +Honduras Honduran +Hong_Kong Hong Kong, Hongkongese +Hungary Hungarian, Magyar +Iceland Icelandic +India Indian +Indonesia Indonesian +Iran Iranian, Persian +Iraq Iraqi +Ireland Irish +Isle_of_Man Manx +Israel Israeli +Italy Italian, Italic +Jamaica Jamaican +Japan Japanese +Jordan Jordanian +Kazakhstan Kazakh, Kazakhstani +Kenya Kenyan +Kiribati I-Kiribati +North_Korea North Korean +South_Korea South Korean +Kosovo Kosovar, Kosovan +Kuwait Kuwaiti +Kyrgyzstan Kyrgyzstani, Kyrgyz, Kirgiz, Kirghiz +Laos Laotian, Lao +Latvia Latvian +Lebanon Lebanese +Lesotho Basotho +Liberia Liberian +Libya Libyan +Liechtenstein Liechtenstein +Lithuania Lithuanian +Luxembourg Luxembourg, Luxembourgish +Macau Macanese, Chinese +Macedonia Macedonian +Madagascar Malagasy +Malawi Malawian +Malaysia Malaysian +Maldives Maldivian +Mali Malian +Malta Maltese +Marshall_Islands Marshallese +Martinique Martiniquais, Martinican +Mauritania Mauritanian +Mauritius Mauritian +Mayotte Mahoran +Mexico Mexican +Micronesia Micronesian +Moldova Moldovan +Monaco Monégasque, Monacan +Mongolia Mongolian +Montenegro Montenegrin +Montserrat Montserratian +Morocco Moroccan +Mozambique Mozambican +Namibia Namibian +Nauru Nauruan +Nepal Nepalese, Nepali +Netherlands Dutch, Netherlandic +New_Caledonia New Caledonian +New_Zealand New Zealand, NZ +Nicaragua Nicaraguan +Niue Niuean +Niger Nigerien +Nigeria Nigerian +Norway Norwegian +Northern_Ireland Northern Irish, Irish +Northern_Marianas Northern Marianan +Oman Omani +Pakistan Pakistani +Palestine Palestinian +Palau Palauan +Panama Panamanian +Papua_New_Guinea Papua New Guinean, Papuan +Paraguay Paraguayan +Peru Peruvian +Philippines Philippine, Filipino +Pitcairn_Island Pitcairn Island +Poland Polish +Portugal Portuguese 
+Puerto_Rico Puerto Rican +Qatar Qatari +Ireland Irish +Réunion Réunionese, Réunionnais +Romania Romanian +Russia Russian +Rwanda Rwandan +St._Helena St. Helenian +St._Kitts_and_Nevis Kittitian, Nevisian +St._Lucia St. Lucian +Saint-Pierre_and_Miquelon Saint-Pierrais, Miquelonnais +St._Vincent_and_the_Grenadines St. Vincentian, Vincentian +Samoa Samoan +San_Marino Sammarinese +São_Tomé_and_Príncipe São Toméan +Saudi_Arabia Saudi, Saudi Arabian +Scotland Scots, Scottish, Scotch +Senegal Senegalese +Serbia Serbian +Seychelles Seychellois +Sierra_Leone Sierra Leonean +Singapore Singaporean +Slovakia Slovak +Slovenia Slovenian, Slovene +Solomon_Islands Solomon Island +Somalia Somali, Somalian +South_Africa South African +South_Ossetia South Ossetian +South_Sudan South Sudanese +Spain Spanish +Sri_Lanka Sri Lankan +Sudan Sudanese +Surinam Surinamese +Swaziland Swazi +Sweden Swedish +Switzerland Swiss +Syria Syrian +Taiwan Taiwanese +Tajikistan Tajikistani +Tanzania Tanzanian +Thailand Thai +Togo Togolese +Tonga Tongan +Trinidad_and_Tobago Trinidadian, Tobagonian +Tunisia Tunisian +Turkey Turkish +Turkmenistan Turkmen +Tuvalu Tuvaluan +Uganda Ugandan +Ukraine Ukrainian +United_Arab_Emirates Emirati, Emirian +United_Kingdom British, UK +United_States American, US +Uruguay Uruguayan +Uzbekistan Uzbekistani, Uzbek +Vanuatu Ni-Vanuatu, Vanuatuan +Venezuela Venezuelan +Vietnam Vietnamese +Virgin_Islands Virgin Island +Wales Welsh +Wallis_and_Futuna Wallisian, Futunan +Western_Sahara Sahrawi, Sahrawian, Sahraouian +Yemen Yemeni +Zambia Zambian +Zimbabwe Zimbabwean \ No newline at end of file Added: stanbol/branches/STANBOL-1279/entitycoreference/src/test/resources/log4j.properties URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/entitycoreference/src/test/resources/log4j.properties?rev=1643760&view=auto ============================================================================== --- 
stanbol/branches/STANBOL-1279/entitycoreference/src/test/resources/log4j.properties (added) +++ stanbol/branches/STANBOL-1279/entitycoreference/src/test/resources/log4j.properties Mon Dec 8 08:03:19 2014 @@ -0,0 +1,24 @@ +# Licensed to the Apache Software Foundation (ASF) under one or more +# contributor license agreements. See the NOTICE file distributed with +# this work for additional information regarding copyright ownership. +# The ASF licenses this file to You under the Apache License, Version 2.0 +# (the "License"); you may not use this file except in compliance with +# the License. You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. + +# Root logger option +log4j.rootLogger=INFO, stdout + +# Direct log messages to stdout +log4j.appender.stdout=org.apache.log4j.ConsoleAppender +log4j.appender.stdout.Target=System.out +log4j.appender.stdout.layout=org.apache.log4j.PatternLayout +log4j.appender.stdout.layout.ConversionPattern=%d{ABSOLUTE} %5p %c{1}:%L - %m%n +log4j.logger.org.apache.stanbol.enhancer.engines.keywordextraction=DEBUG \ No newline at end of file Added: stanbol/branches/STANBOL-1279/pom.xml URL: http://svn.apache.org/viewvc/stanbol/branches/STANBOL-1279/pom.xml?rev=1643760&view=auto ============================================================================== --- stanbol/branches/STANBOL-1279/pom.xml (added) +++ stanbol/branches/STANBOL-1279/pom.xml Mon Dec 8 08:03:19 2014 @@ -0,0 +1,31 @@ +<?xml version="1.0" encoding="UTF-8"?> +<!-- Licensed to the Apache Software Foundation (ASF) under one or more contributor + license agreements. 
See the NOTICE file distributed with this work for additional + information regarding copyright ownership. The ASF licenses this file to + You under the Apache License, Version 2.0 (the "License"); you may not use + this file except in compliance with the License. You may obtain a copy of + the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required + by applicable law or agreed to in writing, software distributed under the + License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS + OF ANY KIND, either express or implied. See the License for the specific + language governing permissions and limitations under the License. --> +<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" + xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd"> + + <modelVersion>4.0.0</modelVersion> + + <groupId>org.apache.stanbol</groupId> + <artifactId>org.apache.stanbol.stanbol1279.reactor</artifactId> + <version>1.0.0-SNAPSHOT</version> + <packaging>pom</packaging> + + <name>Apache Stanbol Entity Co-Mention Engine Reactor</name> + <description> + Reactor pom for the STANBOL-1279 reactor. + </description> + + <modules> + <module>entitycoreference</module> + </modules> + +</project>
