Author: cpetroaca
Date: Wed Jul 22 18:58:38 2015
New Revision: 1692320

URL: http://svn.apache.org/r1692320
Log:
STANBOL-1279 : Named Entity co-reference resolution engine based on 
yago/dbpedia contextual information
Added Entity Coreference Engine and the entity-coref-dbpedia data bundle.

Added:
    stanbol/trunk/data/sites/entity-coref-dbpedia/
    stanbol/trunk/data/sites/entity-coref-dbpedia/README.md
    stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/build_yago_dbpedia_labels.sh
    stanbol/trunk/data/sites/entity-coref-dbpedia/download_index.xml
    stanbol/trunk/data/sites/entity-coref-dbpedia/pom.xml
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/LICENSE
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/NOTICE
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/README
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/
    stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config
    
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config
    stanbol/trunk/enhancement-engines/entitycoreference/
    stanbol/trunk/enhancement-engines/entitycoreference/README.md
    stanbol/trunk/enhancement-engines/entitycoreference/pom.xml
    stanbol/trunk/enhancement-engines/entitycoreference/src/
    stanbol/trunk/enhancement-engines/entitycoreference/src/license/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/license/THIRD-PARTY.properties
    stanbol/trunk/enhancement-engines/entitycoreference/src/main/
    stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/
    stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/Constants.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/EntityCoReferenceEngine.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/datamodel/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/datamodel/NounPhrase.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/datamodel/PlaceAdjectival.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/CoreferenceFinder.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/CoreferenceFinderConfig.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/Dictionaries.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/InMemoryEntityTypeIndex.java
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/impl/NounPhraseFilterer.java
    stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/OSGI-INF/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/OSGI-INF/metatype/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/OSGI-INF/metatype/metatype.properties
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/config/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/config/pos/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/config/pos/en.properties
    stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/data/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/data/place_adjectivals/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/main/resources/data/place_adjectivals/en
    stanbol/trunk/enhancement-engines/entitycoreference/src/test/
    stanbol/trunk/enhancement-engines/entitycoreference/src/test/resources/
    
stanbol/trunk/enhancement-engines/entitycoreference/src/test/resources/log4j.properties
Modified:
    stanbol/trunk/data/pom.xml
    stanbol/trunk/enhancement-engines/pom.xml

Modified: stanbol/trunk/data/pom.xml
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/pom.xml?rev=1692320&r1=1692319&r2=1692320&view=diff
==============================================================================
--- stanbol/trunk/data/pom.xml (original)
+++ stanbol/trunk/data/pom.xml Wed Jul 22 18:58:38 2015
@@ -61,6 +61,7 @@
 
     <module>sites/dbpedia</module>
     <module>sites/dbpediacached</module>
+       <!--module>sites/entity-coref-dbpedia</module-->
 
     <module>registries/default</module>
 

Added: stanbol/trunk/data/sites/entity-coref-dbpedia/README.md
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/README.md?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/data/sites/entity-coref-dbpedia/README.md (added)
+++ stanbol/trunk/data/sites/entity-coref-dbpedia/README.md Wed Jul 22 18:58:38 
2015
@@ -0,0 +1,67 @@
+<!-- 
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+
+## Building the DBpedia 3.9 index with yago types
+
+This index will contain the yago rdf:types and several spatial/org membership properties from the DBpedia index.
+NOTE: At the moment the index is available only for English.
+
+### (1) Follow the instructions at entityhub/indexing/dbpedia/README.md and 
build the dbpedia index with the following configuration:
+
+#### (1) Use the RDF dumps (in N-Triple format) from :
+       http://downloads.dbpedia.org/3.9/dbpedia_3.9.owl
+       http://downloads.dbpedia.org/3.9/en/labels_en.nt.bz2
+       http://downloads.dbpedia.org/3.9/en/instance_types_en.nt.bz2
+       http://downloads.dbpedia.org/3.9/en/mappingbased_properties_en.nt.bz2
+       http://downloads.dbpedia.org/3.9/links/yago_types.nt.bz2
+       
+#### (2) The mappings.txt file must contain the following entries:
+       
+       rdfs:label | d=entityhub:text
+       rdf:type | d=entityhub:ref
+       dbp-ont:birthPlace | d=entityhub:ref
+       dbp-ont:region | d=entityhub:ref
+       dbp-ont:foundationPlace | d=entityhub:ref
+       dbp-ont:locationCity | d=entityhub:ref
+       dbp-ont:location | d=entityhub:ref
+       dbp-ont:hometown | d=entityhub:ref
+       dbp-ont:country | d=entityhub:ref
+       dbp-ont:occupation | d=entityhub:ref
+       dbp-ont:associatedBand | d=entityhub:ref
+       dbp-ont:employer | d=entityhub:ref
+       
+#### (3) Change the indexing/config/indexing.properties file to include the 
following attributes:
+       name=entity-coref-dbpedia
+       description=DBpedia.org
+
+### (2) Run the script dbpedia_yago_classes/build_yago_dbpedia_labels.sh, which will create the dbpedia_yago_classes_labels.nt.bz2 archive
+which contains the labels of the yago types.
+
+### (3) Follow the instructions at entityhub/indexing/genericrdf/README.md and 
rebuild the dbpedia index in order to include the
+aforementioned yago types labels. After you init the indexer but before you 
run it go through the following steps:
+
+#### (1) Copy the dbpedia_yago_classes_labels.nt.bz2 to the indexing/resources/rdfdata folder.
+
+#### (2) Change the indexing/config/indexing.properties to include the 
following attributes:
+       
+       name=entity-coref-dbpedia
+       description=DBpedia.org
+       
+#### (3) The indexing/config/mappings.txt file must only contain the 
rdfs:label attribute
+
+#### (4) Copy the contents of the indexing/destination folder produced in step ### (1) to the indexing/destination folder
+of the generic rdf indexing in step ### (3).

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/build_yago_dbpedia_labels.sh
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/build_yago_dbpedia_labels.sh?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/build_yago_dbpedia_labels.sh
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/dbpedia_yago_classes/build_yago_dbpedia_labels.sh
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,71 @@
+#!/usr/bin/env bash
+
+YAGO=http://resources.mpi-inf.mpg.de/yago-naga/yago/download/yago/
+
+files=(yagoLabels.ttl.7z \
+       yagoDBpediaClasses.ttl.7z
+    )
+YAGO_LABELS=yagoLabels.ttl
+YAGO_DBPEDIA_CLASSES=yagoDBpediaClasses.ttl
+YAGO_WORDNET_LABELS=yago_wordnet_labels
+YAGO_WORDNET_DBPEDIA_CLASSES=yago_wordnet_dbpedia_classes
+DBPEDIA_YAGO_CLASS_LABELS_NT=dbpedia_yago_classes_labels.nt
+
+# First, download and decompress the necessary yago files.
+for i in "${files[@]}"
+do
+    :
+               if [ ! -f ${i} ]; 
+               then
+                       url=${YAGO}/${i}
+                       wget -c ${url}
+               fi
+               
+               echo "Unzipping ${i}"
+               7za e ${i}
+done
+
+# Second, create a file with <wordnet_class> rdfs:label "label" format.
+grep '^<wordnet_' ${YAGO_LABELS} | grep 'rdfs:label' > ${YAGO_WORDNET_LABELS}
+
+# Third, create a file with wordnet to dbpedia yago class mappings.
+grep '^<wordnet_' ${YAGO_DBPEDIA_CLASSES} > ${YAGO_WORDNET_DBPEDIA_CLASSES}
+
+# Last, create the nt file which will contain the dbpedia yago class and its 
labels.
+touch ${DBPEDIA_YAGO_CLASS_LABELS_NT};
+
+YAGO_LABELS_NUM_LINES=$(wc -l < ${YAGO_WORDNET_LABELS})
+PROCESSED_LINES=0
+NOT_FOUND_LINES=0
+
+echo -e "\n\nStarting to process $YAGO_LABELS_NUM_LINES lines"
+
+while read line
+do
+       wordnet_class=`echo $line | awk '{print $1}'`;
+       dbpedia_class=`grep $wordnet_class $YAGO_WORDNET_DBPEDIA_CLASSES | awk 
'{split($0,a," "); print a[3]}'`;
+       
+       if [ -z "$dbpedia_class" ]
+       then
+               ((NOT_FOUND_LINES++));
+               continue;
+       fi      
+       
+       mapped_line=${line/$wordnet_class/$dbpedia_class};
+       
mapped_line_with_label=${mapped_line/rdfs:label/<http://www.w3.org/2000/01/rdf-schema#label>};
+       mapped_line_with_label_lang=${mapped_line_with_label/@eng/@en};
+       
+       echo $mapped_line_with_label_lang >> ${DBPEDIA_YAGO_CLASS_LABELS_NT};
+       
+       ((PROCESSED_LINES++));
+       echo -ne "$PROCESSED_LINES/$YAGO_LABELS_NUM_LINES processed\r";
+done < ${YAGO_WORDNET_LABELS}
+
+echo -e "\nDone processing lines. Skipped $NOT_FOUND_LINES not found dbpedia 
classes. Creating .nt archive."
+bzip2 ${DBPEDIA_YAGO_CLASS_LABELS_NT}
+
+# Cleanup
+rm ${YAGO_LABELS}
+rm ${YAGO_DBPEDIA_CLASSES}
+rm ${YAGO_WORDNET_LABELS}
+rm ${YAGO_WORDNET_DBPEDIA_CLASSES}
\ No newline at end of file

Added: stanbol/trunk/data/sites/entity-coref-dbpedia/download_index.xml
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/download_index.xml?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/data/sites/entity-coref-dbpedia/download_index.xml (added)
+++ stanbol/trunk/data/sites/entity-coref-dbpedia/download_index.xml Wed Jul 22 
18:58:38 2015
@@ -0,0 +1,32 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<project name="Index Download Helper" default="download" basedir=".">
+  <description>
+    Contains only a single target that is used by the Maven Ant
+    Plugin to download the Index passed via 'index.url'
+    to 'target.directory'
+  </description>
+   
+  <target name="download">
+    <copy todir="${target.directory}" flatten="true">
+      <resources>
+        <url url="${index.url}"/>
+      </resources>
+    </copy>
+  </target>
+</project>

Added: stanbol/trunk/data/sites/entity-coref-dbpedia/pom.xml
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/pom.xml?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/data/sites/entity-coref-dbpedia/pom.xml (added)
+++ stanbol/trunk/data/sites/entity-coref-dbpedia/pom.xml Wed Jul 22 18:58:38 
2015
@@ -0,0 +1,163 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+   Licensed to the Apache Software Foundation (ASF) under one or more
+   contributor license agreements.  See the NOTICE file distributed with
+   this work for additional information regarding copyright ownership.
+   The ASF licenses this file to You under the Apache License, Version 2.0
+   (the "License"); you may not use this file except in compliance with
+   the License.  You may obtain a copy of the License at
+
+        http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+  <modelVersion>4.0.0</modelVersion>
+
+  <parent>
+    <groupId>org.apache.stanbol</groupId>
+    <artifactId>org.apache.stanbol.data.parent</artifactId>
+    <version>1.2.0-SNAPSHOT</version>
+    <relativePath>../../parent</relativePath>
+  </parent>
+
+  <groupId>org.apache.stanbol</groupId>
+  <artifactId>org.apache.stanbol.data.sites.entity-coref-dbpedia</artifactId>
+  <version>1.2.0-SNAPSHOT</version>
+  <packaging>bundle</packaging>
+
+  <name>Apache Stanbol Data: DBpedia.org and Yago.org</name>
+  <description>
+    This bundle allows DBpedia and Yago to be used as a Referenced Site for the
+    Entity Co-reference Engine. The build also downloads the DBpedia index.
+  </description>
+
+  <inceptionYear>2015</inceptionYear>
+  <licenses>
+    <license>
+      <name>Apache Software License, Version 2.0</name>
+      <url>http://www.apache.org/licenses/LICENSE-2.0.txt</url>
+      <distribution>repo</distribution>
+      <comments>A business-friendly OSS license</comments>
+    </license>
+  </licenses>  
+
+  <scm>
+    
<connection>scm:svn:http://svn.apache.org/repos/asf/stanbol/trunk/data/sites/entity-coref-dbpedia</connection>
+    
<developerConnection>scm:svn:https://svn.apache.org/repos/asf/stanbol/trunk/data/sites/entity-coref-dbpedia</developerConnection>
+    <url>http://stanbol.apache.org/</url>
+  </scm>
+
+  <properties>
+    <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding>
+    
<dbpedia.default.index.url>https://github.com/cpetroaca/stanbol-indices/releases/download/trunk/entity-coref-dbpedia.solrindex.zip</dbpedia.default.index.url>
+    
<dbpedia.default.path>org/apache/stanbol/data/site/entity-coref-dbpedia/default</dbpedia.default.path>
+    
<dbpedia.default.index.path>${dbpedia.default.path}/index</dbpedia.default.index.path>
+    
<dbpedia.default.config.path>${dbpedia.default.path}/config</dbpedia.default.config.path>
+    <downloadWarning>
+*                  
+* WARNING - this build downloads a DBpedia index
+* that is *not* licensed under the Apache License, but under the
+* Creative Commons Attribution-ShareAlike 3.0 Unported License.
+*
+    </downloadWarning>    
+  </properties>
+
+  <build>
+    <plugins>
+      <plugin>
+        <groupId>org.apache.felix</groupId>
+        <artifactId>maven-bundle-plugin</artifactId>
+        <inherited>true</inherited>
+        <extensions>true</extensions>
+        <configuration>
+          <instructions>
+            <!-- 
+              Extension used to provide files in that directory to the
+              DataFileProvider
+              -->
+            <Data-Files>${dbpedia.default.index.path}</Data-Files>
+            <!-- 
+              Use a priority lower than 0 to allow providers without a
+              defined ranking to override this default data.
+             -->
+            <Data-Files-Priority>-100</Data-Files-Priority>
+            <!-- 
+              Extension used by the Bundle-Installer to load OSGI 
+              component configuration  
+             -->
+            <Install-Path>${dbpedia.default.config.path}</Install-Path>
+            <_versionpolicy>$${version;===;${@}}</_versionpolicy>
+          </instructions>
+        </configuration>
+      </plugin>
+      <plugin>
+        <groupId>org.apache.maven.plugins</groupId>
+        <artifactId>maven-antrun-plugin</artifactId>
+        <executions>
+          <execution>
+            <id>download</id>
+            <phase>generate-resources</phase>
+            <configuration>
+              <!--
+                TODO: I would like to add an "unless" constraint to the
+                target that prevents execution if Maven operates in offline
+                mode. However I was not able to find out how to obtain this
+                information. ${settings.offline} (as noted by several
+                resources) does not work.
+                Until this is fixed, builds will fail if no internet
+                connection is available!
+              -->
+              <target>
+                <property name="target.directory" 
value="${project.basedir}/downloads/resources/${dbpedia.default.index.path}" />
+                <property name="index.url" 
value="${dbpedia.default.index.url}" />
+                                
+                <echo message="copy Solr Index " />
+                <echo message=" FROM ${index.url} " />
+                <echo message=" TO ${target.directory}" />
+
+                <ant antfile="${basedir}/download_index.xml">
+                  <target name="download" />
+                </ant>
+              </target>
+            </configuration>
+            <goals>
+              <goal>run</goal>
+            </goals>
+          </execution>
+        </executions>
+      </plugin>
+      <plugin>
+        <groupId>org.apache.rat</groupId>
+        <artifactId>apache-rat-plugin</artifactId>
+        <configuration>
+          <excludes>
+            <!-- AL20 licensed. See src/main/resources/README -->
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref</exclude>
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.enhancer.engines.entitytagging.impl.NamedEntityTaggingEngine-entity-coref-dbpedia.config</exclude>
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config</exclude>
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config</exclude>
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config</exclude>
+
+            <!-- Licensed under Creative Commons Attribution-ShareAlike 3.0 
Unported License -->
+            
<exclude>src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/index/entity-coref-dbpedia.solrindex.zip</exclude>
+          </excludes>
+        </configuration>
+      </plugin>
+      <plugin>
+        <groupId>org.apache.maven.plugins</groupId>
+        <artifactId>maven-deploy-plugin</artifactId>
+        <configuration>
+          <!-- DBPedia dumps can be deployed -->
+          <skip>false</skip>
+        </configuration>
+      </plugin>
+    </plugins>
+  </build>
+
+</project>

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/LICENSE
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/LICENSE?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/LICENSE
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/LICENSE
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,362 @@
+
+-----------------------------------------------------------------------------
+
+Creative Commons Legal Code
+
+Attribution-ShareAlike 3.0 Unported
+
+    CREATIVE COMMONS CORPORATION IS NOT A LAW FIRM AND DOES NOT PROVIDE
+    LEGAL SERVICES. DISTRIBUTION OF THIS LICENSE DOES NOT CREATE AN
+    ATTORNEY-CLIENT RELATIONSHIP. CREATIVE COMMONS PROVIDES THIS
+    INFORMATION ON AN "AS-IS" BASIS. CREATIVE COMMONS MAKES NO WARRANTIES
+    REGARDING THE INFORMATION PROVIDED, AND DISCLAIMS LIABILITY FOR
+    DAMAGES RESULTING FROM ITS USE.
+
+License
+
+THE WORK (AS DEFINED BELOW) IS PROVIDED UNDER THE TERMS OF THIS CREATIVE
+COMMONS PUBLIC LICENSE ("CCPL" OR "LICENSE"). THE WORK IS PROTECTED BY
+COPYRIGHT AND/OR OTHER APPLICABLE LAW. ANY USE OF THE WORK OTHER THAN AS
+AUTHORIZED UNDER THIS LICENSE OR COPYRIGHT LAW IS PROHIBITED.
+
+BY EXERCISING ANY RIGHTS TO THE WORK PROVIDED HERE, YOU ACCEPT AND AGREE
+TO BE BOUND BY THE TERMS OF THIS LICENSE. TO THE EXTENT THIS LICENSE MAY
+BE CONSIDERED TO BE A CONTRACT, THE LICENSOR GRANTS YOU THE RIGHTS
+CONTAINED HERE IN CONSIDERATION OF YOUR ACCEPTANCE OF SUCH TERMS AND
+CONDITIONS.
+
+1. Definitions
+
+ a. "Adaptation" means a work based upon the Work, or upon the Work and
+    other pre-existing works, such as a translation, adaptation,
+    derivative work, arrangement of music or other alterations of a
+    literary or artistic work, or phonogram or performance and includes
+    cinematographic adaptations or any other form in which the Work may be
+    recast, transformed, or adapted including in any form recognizably
+    derived from the original, except that a work that constitutes a
+    Collection will not be considered an Adaptation for the purpose of
+    this License. For the avoidance of doubt, where the Work is a musical
+    work, performance or phonogram, the synchronization of the Work in
+    timed-relation with a moving image ("synching") will be considered an
+    Adaptation for the purpose of this License.
+ b. "Collection" means a collection of literary or artistic works, such as
+    encyclopedias and anthologies, or performances, phonograms or
+    broadcasts, or other works or subject matter other than works listed
+    in Section 1(f) below, which, by reason of the selection and
+    arrangement of their contents, constitute intellectual creations, in
+    which the Work is included in its entirety in unmodified form along
+    with one or more other contributions, each constituting separate and
+    independent works in themselves, which together are assembled into a
+    collective whole. A work that constitutes a Collection will not be
+    considered an Adaptation (as defined below) for the purposes of this
+    License.
+ c. "Creative Commons Compatible License" means a license that is listed
+    at http://creativecommons.org/compatiblelicenses that has been
+    approved by Creative Commons as being essentially equivalent to this
+    License, including, at a minimum, because that license: (i) contains
+    terms that have the same purpose, meaning and effect as the License
+    Elements of this License; and, (ii) explicitly permits the relicensing
+    of adaptations of works made available under that license under this
+    License or a Creative Commons jurisdiction license with the same
+    License Elements as this License.
+ d. "Distribute" means to make available to the public the original and
+    copies of the Work or Adaptation, as appropriate, through sale or
+    other transfer of ownership.
+ e. "License Elements" means the following high-level license attributes
+    as selected by Licensor and indicated in the title of this License:
+    Attribution, ShareAlike.
+ f. "Licensor" means the individual, individuals, entity or entities that
+    offer(s) the Work under the terms of this License.
+ g. "Original Author" means, in the case of a literary or artistic work,
+    the individual, individuals, entity or entities who created the Work
+    or if no individual or entity can be identified, the publisher; and in
+    addition (i) in the case of a performance the actors, singers,
+    musicians, dancers, and other persons who act, sing, deliver, declaim,
+    play in, interpret or otherwise perform literary or artistic works or
+    expressions of folklore; (ii) in the case of a phonogram the producer
+    being the person or legal entity who first fixes the sounds of a
+    performance or other sounds; and, (iii) in the case of broadcasts, the
+    organization that transmits the broadcast.
+ h. "Work" means the literary and/or artistic work offered under the terms
+    of this License including without limitation any production in the
+    literary, scientific and artistic domain, whatever may be the mode or
+    form of its expression including digital form, such as a book,
+    pamphlet and other writing; a lecture, address, sermon or other work
+    of the same nature; a dramatic or dramatico-musical work; a
+    choreographic work or entertainment in dumb show; a musical
+    composition with or without words; a cinematographic work to which are
+    assimilated works expressed by a process analogous to cinematography;
+    a work of drawing, painting, architecture, sculpture, engraving or
+    lithography; a photographic work to which are assimilated works
+    expressed by a process analogous to photography; a work of applied
+    art; an illustration, map, plan, sketch or three-dimensional work
+    relative to geography, topography, architecture or science; a
+    performance; a broadcast; a phonogram; a compilation of data to the
+    extent it is protected as a copyrightable work; or a work performed by
+    a variety or circus performer to the extent it is not otherwise
+    considered a literary or artistic work.
+ i. "You" means an individual or entity exercising rights under this
+    License who has not previously violated the terms of this License with
+    respect to the Work, or who has received express permission from the
+    Licensor to exercise rights under this License despite a previous
+    violation.
+ j. "Publicly Perform" means to perform public recitations of the Work and
+    to communicate to the public those public recitations, by any means or
+    process, including by wire or wireless means or public digital
+    performances; to make available to the public Works in such a way that
+    members of the public may access these Works from a place and at a
+    place individually chosen by them; to perform the Work to the public
+    by any means or process and the communication to the public of the
+    performances of the Work, including by public digital performance; to
+    broadcast and rebroadcast the Work by any means including signs,
+    sounds or images.
+ k. "Reproduce" means to make copies of the Work by any means including
+    without limitation by sound or visual recordings and the right of
+    fixation and reproducing fixations of the Work, including storage of a
+    protected performance or phonogram in digital form or other electronic
+    medium.
+
+2. Fair Dealing Rights. Nothing in this License is intended to reduce,
+limit, or restrict any uses free from copyright or rights arising from
+limitations or exceptions that are provided for in connection with the
+copyright protection under copyright law or other applicable laws.
+
+3. License Grant. Subject to the terms and conditions of this License,
+Licensor hereby grants You a worldwide, royalty-free, non-exclusive,
+perpetual (for the duration of the applicable copyright) license to
+exercise the rights in the Work as stated below:
+
+ a. to Reproduce the Work, to incorporate the Work into one or more
+    Collections, and to Reproduce the Work as incorporated in the
+    Collections;
+ b. to create and Reproduce Adaptations provided that any such Adaptation,
+    including any translation in any medium, takes reasonable steps to
+    clearly label, demarcate or otherwise identify that changes were made
+    to the original Work. For example, a translation could be marked "The
+    original work was translated from English to Spanish," or a
+    modification could indicate "The original work has been modified.";
+ c. to Distribute and Publicly Perform the Work including as incorporated
+    in Collections; and,
+ d. to Distribute and Publicly Perform Adaptations.
+ e. For the avoidance of doubt:
+
+     i. Non-waivable Compulsory License Schemes. In those jurisdictions in
+        which the right to collect royalties through any statutory or
+        compulsory licensing scheme cannot be waived, the Licensor
+        reserves the exclusive right to collect such royalties for any
+        exercise by You of the rights granted under this License;
+    ii. Waivable Compulsory License Schemes. In those jurisdictions in
+        which the right to collect royalties through any statutory or
+        compulsory licensing scheme can be waived, the Licensor waives the
+        exclusive right to collect such royalties for any exercise by You
+        of the rights granted under this License; and,
+   iii. Voluntary License Schemes. The Licensor waives the right to
+        collect royalties, whether individually or, in the event that the
+        Licensor is a member of a collecting society that administers
+        voluntary licensing schemes, via that society, from any exercise
+        by You of the rights granted under this License.
+
+The above rights may be exercised in all media and formats whether now
+known or hereafter devised. The above rights include the right to make
+such modifications as are technically necessary to exercise the rights in
+other media and formats. Subject to Section 8(f), all rights not expressly
+granted by Licensor are hereby reserved.
+
+4. Restrictions. The license granted in Section 3 above is expressly made
+subject to and limited by the following restrictions:
+
+ a. You may Distribute or Publicly Perform the Work only under the terms
+    of this License. You must include a copy of, or the Uniform Resource
+    Identifier (URI) for, this License with every copy of the Work You
+    Distribute or Publicly Perform. You may not offer or impose any terms
+    on the Work that restrict the terms of this License or the ability of
+    the recipient of the Work to exercise the rights granted to that
+    recipient under the terms of the License. You may not sublicense the
+    Work. You must keep intact all notices that refer to this License and
+    to the disclaimer of warranties with every copy of the Work You
+    Distribute or Publicly Perform. When You Distribute or Publicly
+    Perform the Work, You may not impose any effective technological
+    measures on the Work that restrict the ability of a recipient of the
+    Work from You to exercise the rights granted to that recipient under
+    the terms of the License. This Section 4(a) applies to the Work as
+    incorporated in a Collection, but this does not require the Collection
+    apart from the Work itself to be made subject to the terms of this
+    License. If You create a Collection, upon notice from any Licensor You
+    must, to the extent practicable, remove from the Collection any credit
+    as required by Section 4(c), as requested. If You create an
+    Adaptation, upon notice from any Licensor You must, to the extent
+    practicable, remove from the Adaptation any credit as required by
+    Section 4(c), as requested.
+ b. You may Distribute or Publicly Perform an Adaptation only under the
+    terms of: (i) this License; (ii) a later version of this License with
+    the same License Elements as this License; (iii) a Creative Commons
+    jurisdiction license (either this or a later license version) that
+    contains the same License Elements as this License (e.g.,
+    Attribution-ShareAlike 3.0 US)); (iv) a Creative Commons Compatible
+    License. If you license the Adaptation under one of the licenses
+    mentioned in (iv), you must comply with the terms of that license. If
+    you license the Adaptation under the terms of any of the licenses
+    mentioned in (i), (ii) or (iii) (the "Applicable License"), you must
+    comply with the terms of the Applicable License generally and the
+    following provisions: (I) You must include a copy of, or the URI for,
+    the Applicable License with every copy of each Adaptation You
+    Distribute or Publicly Perform; (II) You may not offer or impose any
+    terms on the Adaptation that restrict the terms of the Applicable
+    License or the ability of the recipient of the Adaptation to exercise
+    the rights granted to that recipient under the terms of the Applicable
+    License; (III) You must keep intact all notices that refer to the
+    Applicable License and to the disclaimer of warranties with every copy
+    of the Work as included in the Adaptation You Distribute or Publicly
+    Perform; (IV) when You Distribute or Publicly Perform the Adaptation,
+    You may not impose any effective technological measures on the
+    Adaptation that restrict the ability of a recipient of the Adaptation
+    from You to exercise the rights granted to that recipient under the
+    terms of the Applicable License. This Section 4(b) applies to the
+    Adaptation as incorporated in a Collection, but this does not require
+    the Collection apart from the Adaptation itself to be made subject to
+    the terms of the Applicable License.
+ c. If You Distribute, or Publicly Perform the Work or any Adaptations or
+    Collections, You must, unless a request has been made pursuant to
+    Section 4(a), keep intact all copyright notices for the Work and
+    provide, reasonable to the medium or means You are utilizing: (i) the
+    name of the Original Author (or pseudonym, if applicable) if supplied,
+    and/or if the Original Author and/or Licensor designate another party
+    or parties (e.g., a sponsor institute, publishing entity, journal) for
+    attribution ("Attribution Parties") in Licensor's copyright notice,
+    terms of service or by other reasonable means, the name of such party
+    or parties; (ii) the title of the Work if supplied; (iii) to the
+    extent reasonably practicable, the URI, if any, that Licensor
+    specifies to be associated with the Work, unless such URI does not
+    refer to the copyright notice or licensing information for the Work;
+    and (iv) , consistent with Ssection 3(b), in the case of an
+    Adaptation, a credit identifying the use of the Work in the Adaptation
+    (e.g., "French translation of the Work by Original Author," or
+    "Screenplay based on original Work by Original Author"). The credit
+    required by this Section 4(c) may be implemented in any reasonable
+    manner; provided, however, that in the case of a Adaptation or
+    Collection, at a minimum such credit will appear, if a credit for all
+    contributing authors of the Adaptation or Collection appears, then as
+    part of these credits and in a manner at least as prominent as the
+    credits for the other contributing authors. For the avoidance of
+    doubt, You may only use the credit required by this Section for the
+    purpose of attribution in the manner set out above and, by exercising
+    Your rights under this License, You may not implicitly or explicitly
+    assert or imply any connection with, sponsorship or endorsement by the
+    Original Author, Licensor and/or Attribution Parties, as appropriate,
+    of You or Your use of the Work, without the separate, express prior
+    written permission of the Original Author, Licensor and/or Attribution
+    Parties.
+ d. Except as otherwise agreed in writing by the Licensor or as may be
+    otherwise permitted by applicable law, if You Reproduce, Distribute or
+    Publicly Perform the Work either by itself or as part of any
+    Adaptations or Collections, You must not distort, mutilate, modify or
+    take other derogatory action in relation to the Work which would be
+    prejudicial to the Original Author's honor or reputation. Licensor
+    agrees that in those jurisdictions (e.g. Japan), in which any exercise
+    of the right granted in Section 3(b) of this License (the right to
+    make Adaptations) would be deemed to be a distortion, mutilation,
+    modification or other derogatory action prejudicial to the Original
+    Author's honor and reputation, the Licensor will waive or not assert,
+    as appropriate, this Section, to the fullest extent permitted by the
+    applicable national law, to enable You to reasonably exercise Your
+    right under Section 3(b) of this License (right to make Adaptations)
+    but not otherwise.
+
+5. Representations, Warranties and Disclaimer
+
+UNLESS OTHERWISE MUTUALLY AGREED TO BY THE PARTIES IN WRITING, LICENSOR
+OFFERS THE WORK AS-IS AND MAKES NO REPRESENTATIONS OR WARRANTIES OF ANY
+KIND CONCERNING THE WORK, EXPRESS, IMPLIED, STATUTORY OR OTHERWISE,
+INCLUDING, WITHOUT LIMITATION, WARRANTIES OF TITLE, MERCHANTIBILITY,
+FITNESS FOR A PARTICULAR PURPOSE, NONINFRINGEMENT, OR THE ABSENCE OF
+LATENT OR OTHER DEFECTS, ACCURACY, OR THE PRESENCE OF ABSENCE OF ERRORS,
+WHETHER OR NOT DISCOVERABLE. SOME JURISDICTIONS DO NOT ALLOW THE EXCLUSION
+OF IMPLIED WARRANTIES, SO SUCH EXCLUSION MAY NOT APPLY TO YOU.
+
+6. Limitation on Liability. EXCEPT TO THE EXTENT REQUIRED BY APPLICABLE
+LAW, IN NO EVENT WILL LICENSOR BE LIABLE TO YOU ON ANY LEGAL THEORY FOR
+ANY SPECIAL, INCIDENTAL, CONSEQUENTIAL, PUNITIVE OR EXEMPLARY DAMAGES
+ARISING OUT OF THIS LICENSE OR THE USE OF THE WORK, EVEN IF LICENSOR HAS
+BEEN ADVISED OF THE POSSIBILITY OF SUCH DAMAGES.
+
+7. Termination
+
+ a. This License and the rights granted hereunder will terminate
+    automatically upon any breach by You of the terms of this License.
+    Individuals or entities who have received Adaptations or Collections
+    from You under this License, however, will not have their licenses
+    terminated provided such individuals or entities remain in full
+    compliance with those licenses. Sections 1, 2, 5, 6, 7, and 8 will
+    survive any termination of this License.
+ b. Subject to the above terms and conditions, the license granted here is
+    perpetual (for the duration of the applicable copyright in the Work).
+    Notwithstanding the above, Licensor reserves the right to release the
+    Work under different license terms or to stop distributing the Work at
+    any time; provided, however that any such election will not serve to
+    withdraw this License (or any other license that has been, or is
+    required to be, granted under the terms of this License), and this
+    License will continue in full force and effect unless terminated as
+    stated above.
+
+8. Miscellaneous
+
+ a. Each time You Distribute or Publicly Perform the Work or a Collection,
+    the Licensor offers to the recipient a license to the Work on the same
+    terms and conditions as the license granted to You under this License.
+ b. Each time You Distribute or Publicly Perform an Adaptation, Licensor
+    offers to the recipient a license to the original Work on the same
+    terms and conditions as the license granted to You under this License.
+ c. If any provision of this License is invalid or unenforceable under
+    applicable law, it shall not affect the validity or enforceability of
+    the remainder of the terms of this License, and without further action
+    by the parties to this agreement, such provision shall be reformed to
+    the minimum extent necessary to make such provision valid and
+    enforceable.
+ d. No term or provision of this License shall be deemed waived and no
+    breach consented to unless such waiver or consent shall be in writing
+    and signed by the party to be charged with such waiver or consent.
+ e. This License constitutes the entire agreement between the parties with
+    respect to the Work licensed here. There are no understandings,
+    agreements or representations with respect to the Work not specified
+    here. Licensor shall not be bound by any additional provisions that
+    may appear in any communication from You. This License may not be
+    modified without the mutual written agreement of the Licensor and You.
+ f. The rights granted under, and the subject matter referenced, in this
+    License were drafted utilizing the terminology of the Berne Convention
+    for the Protection of Literary and Artistic Works (as amended on
+    September 28, 1979), the Rome Convention of 1961, the WIPO Copyright
+    Treaty of 1996, the WIPO Performances and Phonograms Treaty of 1996
+    and the Universal Copyright Convention (as revised on July 24, 1971).
+    These rights and subject matter take effect in the relevant
+    jurisdiction in which the License terms are sought to be enforced
+    according to the corresponding provisions of the implementation of
+    those treaty provisions in the applicable national law. If the
+    standard suite of rights granted under applicable copyright law
+    includes additional rights not granted under this License, such
+    additional rights are deemed to be included in the License; this
+    License is not intended to restrict the license of any rights under
+    applicable law.
+
+
+Creative Commons Notice
+
+    Creative Commons is not a party to this License, and makes no warranty
+    whatsoever in connection with the Work. Creative Commons will not be
+    liable to You or any party on any legal theory for any damages
+    whatsoever, including without limitation any general, special,
+    incidental or consequential damages arising in connection to this
+    license. Notwithstanding the foregoing two (2) sentences, if Creative
+    Commons has expressly identified itself as the Licensor hereunder, it
+    shall have all rights and obligations of Licensor.
+
+    Except for the limited purpose of indicating to the public that the
+    Work is licensed under the CCPL, Creative Commons does not authorize
+    the use by either party of the trademark "Creative Commons" or any
+    related trademark or logo of Creative Commons without the prior
+    written consent of Creative Commons. Any permitted use will be in
+    compliance with Creative Commons' then-current trademark usage
+    guidelines, as may be published on its website or otherwise made
+    available upon request from time to time. For the avoidance of doubt,
+    this trademark restriction does not form part of the License.
+
+    Creative Commons may be contacted at http://creativecommons.org/.
\ No newline at end of file

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/NOTICE
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/NOTICE?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/NOTICE
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/appended-resources/META-INF/NOTICE
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,3 @@
+This product contains an index from DBPedia licensed under
+the Creative Commons Attribution-ShareAlike 3.0 Unported License
+http://creativecommons.org/licenses/by-sa/3.0/
\ No newline at end of file

Added: stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/README
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/README?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/README 
(added)
+++ stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/README Wed 
Jul 22 18:58:38 2015
@@ -0,0 +1,25 @@
+Licensed to the Apache Software Foundation (ASF) under one or more
+contributor license agreements.  See the NOTICE file distributed with
+this work for additional information regarding copyright ownership.
+The ASF licenses this file to You under the Apache License, Version 2.0
+(the "License"); you may not use this file except in compliance with
+the License.  You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
+
+The following files are provided under the Apache License, Version 2.0:
+
+org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref
+org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config
+org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config
+org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config
+
+The following file is licensed under Creative Commons Attribution-ShareAlike 
3.0 Unported License:
+
+org/apache/stanbol/data/site/entity-coref-dbpedia/default/index/entity-coref-dbpedia.solrindex.zip

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/entity-coref-dbpedia.solrindex.ref
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,5 @@
+#Tue Feb 03 20:20:31 EET 2015
+Name=SolrIndex for entity-coref-dbpedia
+Synchronized=true
+Description=DBpedia.org 
+Index-Archive=entity-coref-dbpedia.solrindex.zip

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.core.site.CacheImpl-entity-coref-dbpedia.config
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,4 @@
+org.apache.stanbol.entityhub.yard.name="entity-coref-dbpedia\ Cache"
+org.apache.stanbol.entityhub.yard.cacheYardId="entity-coref-dbpediaIndex"
+org.apache.stanbol.entityhub.yard.id="entity-coref-dbpediaIndex"
+org.apache.stanbol.entityhub.yard.description="Cache\ for\ the\ 
entity-coref-dbpedia\ Referenced\ Site\ using\ the\ entity-coref-dbpediaIndex."

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.site.referencedSite-entity-coref-dbpedia.config
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,9 @@
+org.apache.stanbol.entityhub.site.defaultExpireDuration=I"0"
+org.apache.stanbol.entityhub.site.cacheId="entity-coref-dbpediaIndex"
+org.apache.stanbol.entityhub.site.defaultSymbolState="proposed"
+org.apache.stanbol.entityhub.site.name="entity-coref-dbpedia"
+org.apache.stanbol.entityhub.site.id="entity-coref-dbpedia"
+org.apache.stanbol.entityhub.site.description="DBpedia.org\ "
+org.apache.stanbol.entityhub.site.defaultMappedEntityState="proposed"
+org.apache.stanbol.entityhub.site.fieldMappings=("#\ Licensed\ to\ the\ 
Apache\ Software\ Foundation\ (ASF)\ under\ one\ or\ more","#\ contributor\ 
license\ agreements.\ \ See\ the\ NOTICE\ file\ distributed\ with","#\ this\ 
work\ for\ additional\ information\ regarding\ copyright\ ownership.","#\ The\ 
ASF\ licenses\ this\ file\ to\ You\ under\ the\ Apache\ License,\ Version\ 
2.0","#\ (the\ \"License\");\ you\ may\ not\ use\ this\ file\ except\ in\ 
compliance\ with","#\ the\ License.\ \ You\ may\ obtain\ a\ copy\ of\ the\ 
License\ at","#","#\ \ \ \ \ 
http://www.apache.org/licenses/LICENSE-2.0","#","#\ Unless\ required\ by\ 
applicable\ law\ or\ agreed\ to\ in\ writing,\ software","#\ distributed\ 
under\ the\ License\ is\ distributed\ on\ an\ \"AS\ IS\"\ BASIS,","#\ WITHOUT\ 
WARRANTIES\ OR\ CONDITIONS\ OF\ ANY\ KIND,\ either\ express\ or\ implied.","#\ 
See\ the\ License\ for\ the\ specific\ language\ governing\ permissions\ 
and","#\ limitations\ under\ the\ License.","#","#NOTE:\ THIS
 \ IS\ A\ DEFAULT\ MAPPING\ SPECIFICATION\ THAT\ INCLUDES\ MAPPINGS\ FOR","#\ \ 
\ \ \ \ COMMON\ ONTOLOGIES.\ USERS\ MIGHT\ WANT\ TO\ ADAPT\ THIS\ 
CONFIGURATION\ BY","#\ \ \ \ \ \ COMMENTING/UNCOMMENTING\ AND/OR\ ADDING\ NEW\ 
MAPPINGS","","#\ ---\ Define\ the\ Languages\ for\ all\ fields\ ---","#\ to\ 
restrict\ languages\ to\ be\ imported\ (for\ all\ fields)","#|\ 
@\=null;en;de;fr;it","","#NOTE:\ null\ is\ used\ to\ import\ labels\ with\ no\ 
specified\ language","","#\ ---\ Define\ the\ Languages\ for\ all\ fields\ 
---","#\ Uncomment\ to\ restrict\ indexing\ to\ a\ specific\ list\ of\ 
languages,\ otherwise\ all","#\ languages\ are\ indexed","#|\ 
@\=null;en;de;fr;it","","#\ ---\ RDF\ RDFS\ and\ OWL\ Mappings\ ---","#\ This\ 
configuration\ only\ index\ properties\ that\ are\ typically\ used\ to\ 
store","#\ instance\ data\ defined\ by\ such\ namespaces.\ This\ excludes\ 
ontology\ definitions","","#\ NOTE\ that\ nearly\ all\ other\ ontologies\ are\ 
are\ using\ properties\ of\ these\ three
 ","#\ \ \ \ \ \ schemas,\ therefore\ it\ is\ strongly\ recommended\ to\ 
include\ such\ information!","","#rdf:type\ |\ 
d\=entityhub:ref","","rdfs:label\ ","#rdfs:comment","#rdfs:seeAlso\ |\ 
d\=entityhub:ref","","","#owl:sameAs\ |\ d\=entityhub:ref","","#If\ one\ likes\ 
to\ also\ index\ ontologies\ one\ should\ add\ the\ following\ 
statements","#owl:*","#rdfs:*","","#\ ---\ Dublin\ Core\ (DC)\ ---","#\ The\ 
default\ configuration\ imports\ all\ dc-terms\ data\ and\ copies\ values\ for\ 
the","#\ old\ dc-elements\ standard\ over\ to\ the\ according\ properties\ of\ 
the\ dc-terms","#\ standard.","","#\ NOTE\ that\ a\ lot\ of\ other\ ontologies\ 
are\ also\ using\ DC\ for\ some\ of\ there\ data","#\ \ \ \ \ \ therefore\ it\ 
is\ strongly\ recommended\ to\ include\ such\ information!","","#mapping\ for\ 
all\ dc-terms\ properties","#dc:*","","#\ copy\ dc:title\ to\ 
rdfs:label","#dc:title\ >\ rdfs:label","","#\ deactivated\ by\ default,\ 
because\ such\ mappings\ are\ mapped\ to\ dc-terms","#d
 c-elements:*","","#\ mappings\ for\ the\ dc-elements\ properties\ to\ the\ 
dc-terms","#dc-elements:contributor\ >\ dc:contributor","#dc-elements:coverage\ 
>\ dc:coverage","#dc-elements:creator\ >\ dc:creator","#dc-elements:date\ >\ 
dc:date","#dc-elements:description\ >\ dc:description","#dc-elements:format\ >\ 
dc:format","#dc-elements:identifier\ >\ dc:identifier","#dc-elements:language\ 
>\ dc:language","#dc-elements:publisher\ >\ 
dc:publisher","#dc-elements:relation\ >\ dc:relation","#dc-elements:rights\ >\ 
dc:rights","#dc-elements:source\ >\ dc:source","#dc-elements:subject\ >\ 
dc:subject","#dc-elements:title\ >\ dc:title","#dc-elements:type\ >\ 
dc:type","#also\ use\ dc-elements:title\ as\ label","#dc-elements:title\ >\ 
rdfs:label","","#\ ---\ Social\ Networks\ (via\ foaf)\ ---","#The\ Friend\ of\ 
a\ Friend\ schema\ is\ often\ used\ to\ describe\ social\ relations\ between\ 
people","#foaf:*","","#\ copy\ the\ name\ of\ a\ person\ over\ to\ 
rdfs:label","#foaf:name\ >\ rdfs:label","
 ","#\ additional\ data\ types\ checks","#foaf:knows\ |\ 
d\=entityhub:ref","#foaf:made\ |\ d\=entityhub:ref","#foaf:maker\ |\ 
d\=entityhub:ref","#foaf:member\ |\ d\=entityhub:ref","#foaf:homepage\ |\ 
d\=xsd:anyURI","#foaf:depiction\ |\ d\=xsd:anyURI","#foaf:img\ |\ 
d\=xsd:anyURI","#foaf:logo\ |\ d\=xsd:anyURI","#page\ about\ the\ 
entity","#foaf:page\ |\ d\=xsd:anyURI","","","#\ ---\ Schema.org\ --","","#\ 
Defines\ an\ Ontology\ used\ by\ search\ engines\ (Google,\ Yahoo\ and\ Bing)\ 
for\ ","#\ indexing\ websites.","","#schema:*","#\ Copy\ all\ names\ of\ 
schema\ instances\ over\ to\ rdfs:label","#schema:name\ >\ rdfs:label","","#\ 
---\ Simple\ Knowledge\ Organization\ System\ (SKOS)\ ---","","#\ A\ common\ 
data\ model\ for\ sharing\ and\ linking\ knowledge\ organization\ systems\ 
","#\ via\ the\ Semantic\ Web.\ Typically\ used\ to\ encode\ controlled\ 
vocabularies\ as","#\ a\ thesaurus\ \ ","#skos:*","","#\ copy\ all\ SKOS\ 
labels\ (preferred,\ alternative\ and\ hidden)\ over\ to\ rd
 fs:label","#skos:prefLabel\ >\ rdfs:label","#skos:altLabel\ >\ 
rdfs:label","#skos:hiddenLabel\ >\ rdfs:label","","#\ copy\ values\ of\ 
**Match\ relations\ to\ the\ according\ related,\ broader\ and\ 
narrower","#skos:relatedMatch\ >\ skos:related","#skos:broadMatch\ >\ 
skos:broader","#skos:narrowMatch\ >\ skos:skos:narrower","","#similar\ 
mappings\ for\ transitive\ variants\ are\ not\ contained,\ because\ 
transitive","#reasoning\ is\ not\ directly\ supported\ by\ the\ 
Entityhub.","","#\ Some\ SKOS\ thesaurus\ do\ use\ \"skos:transitiveBroader\"\ 
and\ \"skos:transitiveNarrower\"","#\ however\ such\ properties\ are\ only\ 
intended\ to\ be\ used\ by\ reasoners\ to","#\ calculate\ transitive\ closures\ 
over\ broader/narrower\ hierarchies.","#\ see\ 
http://www.w3.org/TR/skos-reference/#L2413\ for\ details","#\ to\ correct\ 
such\ cases\ we\ will\ copy\ transitive\ relations\ to\ their\ 
counterpart","#skos:narrowerTransitive\ >\ 
skos:narrower","#skos:broaderTransitive\ >\ skos:broader","","
 ","#\ ---\ Semantically-Interlinked\ Online\ Communities\ (SIOC)\ ---","","#\ 
An\ ontology\ for\ describing\ the\ information\ in\ online\ communities.\ 
","#\ This\ information\ can\ be\ used\ to\ export\ information\ from\ online\ 
communities\ ","#\ and\ to\ link\ them\ together.\ The\ scope\ of\ the\ 
application\ areas\ that\ SIOC\ can\ ","#\ be\ used\ for\ includes\ (and\ is\ 
not\ limited\ to)\ weblogs,\ message\ boards,\ ","#\ mailing\ lists\ and\ chat\ 
channels.","#sioc:*","","#\ ---\ biographical\ information\ (bio)","#\ A\ 
vocabulary\ for\ describing\ biographical\ information\ about\ people,\ both\ 
living","#\ and\ dead.\ (see\ http://vocab.org/bio/0.1/)","#bio:*","","#\ ---\ 
Rich\ Site\ Summary\ (rss)\ ---","#rss:*","","#\ ---\ GoodRelations\ (gr)\ 
---","#\ GoodRelations\ is\ a\ standardised\ vocabulary\ for\ product,\ price,\ 
and\ company\ data","#gr:*","","#\ ---\ Creative\ Commons\ Rights\ Expression\ 
Language\ (cc)","#\ The\ Creative\ Commons\ Rights\ Expression\ Langua
 ge\ (CC\ REL)\ lets\ you\ describe\ ","#\ copyright\ licenses\ in\ 
RDF.","#cc:*","","","","","","")
+org.apache.stanbol.entityhub.site.cacheStrategy="all"

Added: 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config
 (added)
+++ 
stanbol/trunk/data/sites/entity-coref-dbpedia/src/main/resources/org/apache/stanbol/data/site/entity-coref-dbpedia/default/config/org.apache.stanbol.entityhub.yard.solr.impl.SolrYard-entity-coref-dbpedia.config
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,7 @@
+org.apache.stanbol.entityhub.yard.solr.solrUri="entity-coref-dbpedia"
+org.apache.stanbol.entityhub.yard.name="entity-coref-dbpedia\ Index"
+org.apache.stanbol.entityhub.yard.solr.multiYardIndexLayout=B"false"
+org.apache.stanbol.entityhub.yard.solr.useDefaultConfig=B"false"
+org.apache.stanbol.entityhub.yard.id="entity-coref-dbpediaIndex"
+http://stanbol.apache.org/ontology/entityhub/entityhub#entityRank="http://stanbol.apache.org/ontology/entityhub/entityhub#entityRank";
+org.apache.stanbol.entityhub.yard.description="Full\ local\ index\ for\ the\ 
Referenced\ Site\ \"entity-coref-dbpedia\"."

Added: stanbol/trunk/enhancement-engines/entitycoreference/README.md
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/enhancement-engines/entitycoreference/README.md?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/enhancement-engines/entitycoreference/README.md (added)
+++ stanbol/trunk/enhancement-engines/entitycoreference/README.md Wed Jul 22 
18:58:38 2015
@@ -0,0 +1,42 @@
+<!-- 
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+      http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+
+# Entity Co-reference Engine
+
+The Entity Co-reference Engine performs co-reference resolution of Named Entities in a given text.
+The co-references are noun phrases that refer to those Named Entities by having a minimal set of attributes which match
+contextual information (the rdf:type of the entity, plus spatial and object-function information) from entity repositories
+such as DBpedia and YAGO for that Named Entity.
+
+Take the following text as an example: "Microsoft has posted its 2013 earnings. The software company did better than expected. ... The Redmond-based company will hire 500 new developers this year."
+The enhancement engine will link "Microsoft" with "The software company" and "The Redmond-based company".
+
+## (1) Configuring the Engine
+TODO
+
+## (2) Running the Entity co-reference engine in Stanbol.
+
+In order to run the engine you need to add it to a chain that also contains 
the following engine types:
+- a language detection engine
+- a sentence detection engine (like opennlp-sentence)
+- a token detection engine (like opennlp-token)
+- a NER detection engine (like opennlp-ner)
+- a noun phrase detection engine (like pos-chunker)
+
+The default data bundle, which contains the DBpedia and YAGO data used for co-reference resolution, is the entity-coref-dbpedia data bundle.
+You can find the bundle in data/sites/entity-coref-dbpedia. Install this bundle into Stanbol.
+You can create your own data bundle, but be sure to enter the correct attributes when configuring the engine (see section 1).

Added: stanbol/trunk/enhancement-engines/entitycoreference/pom.xml
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/enhancement-engines/entitycoreference/pom.xml?rev=1692320&view=auto
==============================================================================
--- stanbol/trunk/enhancement-engines/entitycoreference/pom.xml (added)
+++ stanbol/trunk/enhancement-engines/entitycoreference/pom.xml Wed Jul 22 
18:58:38 2015
@@ -0,0 +1,129 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!--
+   Licensed to the Apache Software Foundation (ASF) under one or more
+   contributor license agreements.  See the NOTICE file distributed with
+   this work for additional information regarding copyright ownership.
+   The ASF licenses this file to You under the Apache License, Version 2.0
+   (the "License"); you may not use this file except in compliance with
+   the License.  You may obtain a copy of the License at
+
+        http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
+-->
+<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
+
+  <modelVersion>4.0.0</modelVersion>
+
+  <parent>
+    <groupId>org.apache.stanbol</groupId>
+    <artifactId>apache-stanbol-enhancement-engines</artifactId>
+    <version>1.0.0-SNAPSHOT</version>
+    <relativePath>..</relativePath>
+  </parent>
+
+  <groupId>org.apache.stanbol</groupId>
+  <artifactId>org.apache.stanbol.enhancer.engines.entitycoreference</artifactId>
+  <version>1.0.0-SNAPSHOT</version>
+  <packaging>bundle</packaging>
+
+  <name>Apache Stanbol Enhancement Engine : Entity Co-Reference</name>
+  <description>
+    An Engine that finds co-references of Named Entities based on 
+       dbpedia/yago concepts.
+  </description>
+
+  <inceptionYear>2014</inceptionYear>
+
+  <scm>
+    <connection>
+      
scm:svn:http://svn.apache.org/repos/asf/stanbol/trunk/enhancement-engines/entitycoreference/
+    </connection>
+    <developerConnection>
+      
scm:svn:https://svn.apache.org/repos/asf/stanbol/trunk/enhancement-engines/entitycoreference/
+    </developerConnection>
+    <url>http://stanbol.apache.org/</url>
+  </scm>
+
+  <build>
+    <plugins>
+      <plugin>
+        <groupId>org.apache.felix</groupId>
+        <artifactId>maven-bundle-plugin</artifactId>
+        <extensions>true</extensions>
+        <configuration>
+          <instructions>
+            <Import-Package>
+              org.apache.stanbol.enhancer.servicesapi; provide:=true; 
version="[0.11,1.1)",
+              
org.apache.stanbol.enhancer.engines.entitylinking;version=${project.version}; 
provide:=true,
+              *
+            </Import-Package>
+            <Private-Package>
+              
org.apache.stanbol.enhancer.engines.entitycoreference.*;version=${project.version}
+            </Private-Package>
+          </instructions>
+        </configuration>
+      </plugin>
+      <plugin>
+        <groupId>org.apache.felix</groupId>
+        <artifactId>maven-scr-plugin</artifactId>
+      </plugin>
+          <plugin>
+          <groupId>org.apache.maven.plugins</groupId>
+          <artifactId>maven-compiler-plugin</artifactId>
+          <version>3.1</version>
+          <configuration>
+            <source>1.7</source>
+            <target>1.7</target>
+          </configuration>
+        </plugin>
+    </plugins>
+  </build>
+
+  <dependencies>
+    <dependency>
+      <groupId>org.apache.stanbol</groupId>
+      
<artifactId>org.apache.stanbol.commons.namespaceprefix.service</artifactId>
+      <version>1.0.0-SNAPSHOT</version>
+    </dependency>
+
+       <dependency>
+      <groupId>org.apache.stanbol</groupId>
+      
<artifactId>org.apache.stanbol.enhancer.engines.entitylinking.engine</artifactId>
+      <version>1.0.0-SNAPSHOT</version>
+    </dependency>
+    
+    <dependency>
+      <groupId>org.apache.stanbol</groupId>
+      <artifactId>org.apache.stanbol.entityhub.servicesapi</artifactId>
+      <version>1.0.0-SNAPSHOT</version>
+    </dependency>
+
+    <dependency>
+      <groupId>org.apache.felix</groupId>
+      <artifactId>org.apache.felix.scr.annotations</artifactId>
+    </dependency>
+    <dependency>
+      <groupId>org.slf4j</groupId>
+      <artifactId>slf4j-api</artifactId>
+    </dependency>
+    
+    <!-- Test dependencies -->
+    <dependency>
+      <groupId>junit</groupId>
+      <artifactId>junit</artifactId>
+      <scope>test</scope>      
+    </dependency>
+    <dependency>  <!-- used for debug level logging during tests -->
+      <groupId>org.slf4j</groupId>
+      <artifactId>slf4j-log4j12</artifactId>
+      <scope>test</scope>
+    </dependency>
+
+  </dependencies>
+
+</project>

Added: 
stanbol/trunk/enhancement-engines/entitycoreference/src/license/THIRD-PARTY.properties
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/enhancement-engines/entitycoreference/src/license/THIRD-PARTY.properties?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/enhancement-engines/entitycoreference/src/license/THIRD-PARTY.properties
 (added)
+++ 
stanbol/trunk/enhancement-engines/entitycoreference/src/license/THIRD-PARTY.properties
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,24 @@
+# Generated by org.codehaus.mojo.license.AddThirdPartyMojo
+#-------------------------------------------------------------------------------
+# Already used licenses in project :
+# - Apache Software License
+# - Apache Software License, Version 2.0
+# - BSD License
+# - Common Development And Distribution License (CDDL), Version 1.0
+# - Common Development And Distribution License (CDDL), Version 1.1
+# - Common Public License, Version 1.0
+# - Eclipse Public License, Version 1.0
+# - GNU General Public License (GPL), Version 2 with classpath exception
+# - GNU Lesser General Public License (LGPL)
+# - GNU Lesser General Public License (LGPL), Version 2.1
+# - ICU License
+# - MIT License
+# - New BSD License
+# - Public Domain License
+#-------------------------------------------------------------------------------
+# Please fill the missing licenses for dependencies :
+#
+#
+#Tue Jul 23 16:41:35 CEST 2013
+org.osgi--org.osgi.compendium--4.1.0=The Apache Software License, Version 2.0
+org.osgi--org.osgi.core--4.1.0=The Apache Software License, Version 2.0

Added: 
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/Constants.java
URL: 
http://svn.apache.org/viewvc/stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/Constants.java?rev=1692320&view=auto
==============================================================================
--- 
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/Constants.java
 (added)
+++ 
stanbol/trunk/enhancement-engines/entitycoreference/src/main/java/org/apache/stanbol/enhancer/engines/entitycoreference/Constants.java
 Wed Jul 22 18:58:38 2015
@@ -0,0 +1,72 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements.  See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License.  You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+package org.apache.stanbol.enhancer.engines.entitycoreference;
+
/**
 * Constants used engine wide.
 *
 * <p>Non-instantiable holder class: it only exposes {@code static final} values
 * and declares a private constructor.
 *
 * @author Cristian Petroaca
 */
public final class Constants {
    /**
     * The main config folder of the engine.
     */
    public static final String CONFIG_FOLDER = "/config";

    /**
     * The main data folder.
     */
    public static final String DATA_FOLDER = "/data";

    /**
     * The path to the pos config folder, located under {@link #CONFIG_FOLDER}.
     */
    public static final String POS_CONFIG_FOLDER = CONFIG_FOLDER + "/pos";

    /**
     * The path to the place adjectivals folder, located under {@link #DATA_FOLDER}.
     */
    public static final String PLACE_ADJECTIVALS_FOLDER = DATA_FOLDER + "/place_adjectivals";

    /**
     * Default value of the maximum-distance setting.
     *
     * <p>NOTE(review): the unit the distance is measured in is not visible in this
     * class - confirm against the engine configuration.
     */
    public static final int MAX_DISTANCE_DEFAULT_VALUE = 1;

    /**
     * Special value of the maximum-distance setting. Judging by its name it stands
     * for "no distance constraint" - confirm against the code that reads it.
     */
    public static final int MAX_DISTANCE_NO_CONSTRAINT = -1;

    /**
     * Comma-separated list of DBpedia ontology property URIs. Presumably the
     * default spatial attributes looked up for person entities - confirm against
     * the engine configuration.
     */
    public static final String DEFAULT_SPATIAL_ATTR_FOR_PERSON =
            "http://dbpedia.org/ontology/birthPlace,"
            + "http://dbpedia.org/ontology/region,http://dbpedia.org/ontology/nationality,http://dbpedia.org/ontology/country";

    /**
     * Comma-separated list of DBpedia ontology property URIs. Presumably the
     * default spatial attributes looked up for organization entities - confirm
     * against the engine configuration.
     */
    public static final String DEFAULT_SPATIAL_ATTR_FOR_ORGANIZATION =
            "http://dbpedia.org/ontology/foundationPlace,"
            + "http://dbpedia.org/ontology/locationCity,http://dbpedia.org/ontology/location,http://dbpedia.org/ontology/hometown";

    /**
     * Comma-separated list of DBpedia ontology property URIs. Presumably the
     * default spatial attributes looked up for place entities - confirm against
     * the engine configuration.
     */
    public static final String DEFAULT_SPATIAL_ATTR_FOR_PLACE =
            "http://dbpedia.org/ontology/country,"
            + "http://dbpedia.org/ontology/subdivisionName,http://dbpedia.org/ontology/location";

    /**
     * Comma-separated list of class URIs (DBpedia ontology, YAGO, schema.org and
     * OWL). Presumably the entity classes that are ignored by default - confirm
     * against the engine configuration.
     */
    public static final String DEFAULT_ENTITY_CLASSES_TO_EXCLUDE =
            "http://dbpedia.org/ontology/Person,"
            + "http://dbpedia.org/class/yago/LivingThing100004258,http://dbpedia.org/class/yago/PhysicalEntity100001930,"
            + "http://dbpedia.org/class/yago/Abstraction100002137,http://dbpedia.org/class/yago/Organism100004475,"
            + "http://dbpedia.org/class/yago/Location100027167,http://schema.org/Place,http://dbpedia.org/class/yago/Object100002684,"
            + "http://dbpedia.org/class/yago/YagoGeoEntity,http://www.w3.org/2002/07/owl#Thing,"
            + "http://dbpedia.org/class/yago/YagoPermanentlyLocatedEntity";

    /**
     * Comma-separated list of DBpedia ontology property URIs. Presumably the
     * default organization-related attributes looked up for person entities -
     * confirm against the engine configuration.
     */
    public static final String DEFAULT_ORG_ATTR_FOR_PERSON =
            "http://dbpedia.org/ontology/occupation,"
            + "http://dbpedia.org/ontology/associatedBand,http://dbpedia.org/ontology/employer";

    /** Not instantiable: this class only holds constants. */
    private Constants() {
    }
}


Reply via email to