Hi,

I have to say that everything works great for string, txt and doc files, as
well as web pages. The only thing I am confused about concerns PDF documents.
I attached the results for this document:
http://www.gtbit.org/downloads/dwdmsem6/dwdmsem6lman.pdf. I didn't access the
document using this URL; I downloaded it and accessed it as C:\temp\weka.pdf.
I get a correct answer, I mean, there are no errors, but I think there should
be more annotated concepts.

Could you please try to annotate this document and compare results? I am
sure you will be able to find what I did wrong.

Best,
Srecko
<?xml version="1.0" encoding="windows-1252"?>
<!-- Enhancement results serialized as RDF/XML: one content item, the contact
     referenced as its creator, and a single TextAnnotation enhancement. -->
<rdf:RDF
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:j.0="http://www.semanticdesktop.org/ontologies/2007/01/19/nie#"
    xmlns:j.1="http://purl.org/dc/terms/"
    xmlns:j.2="http://www.semanticdesktop.org/ontologies/2007/03/22/nco#"
    xmlns:j.3="http://www.semanticdesktop.org/ontologies/2007/03/22/nfo#"
    xmlns:j.4="http://fise.iks-project.eu/ontology/">
  <!-- Document-level metadata of the content item (a paginated text document). -->
  <rdf:Description
      rdf:about="urn:content-item-sha1-f3e0ce27fa0eb5a69fec0c0dbaf90fcb456cdf55">
    <j.0:contentCreated
        rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2008-04-30T18:58:05.000+02:00</j.0:contentCreated>
    <j.0:generator>Acrobat Distiller 7.0.5 (Windows)</j.0:generator>
    <j.0:generator>Acrobat PDFMaker 7.0.7 for Word</j.0:generator>
    <j.0:title>WEKA</j.0:title>
    <j.2:creator rdf:resource="urn:uuid:d4011136-3aa6-4c8b-919d-0a3506c20c31"/>
    <j.0:contentLastModified
        rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2008-04-30T19:00:37.000+02:00</j.0:contentLastModified>
    <rdf:type
        rdf:resource="http://www.semanticdesktop.org/ontologies/2007/03/22/nfo#PaginatedTextDocument"/>
    <j.3:pageCount
        rdf:datatype="http://www.w3.org/2001/XMLSchema#integer">22</j.3:pageCount>
  </rdf:Description>
  <!-- Contact resource that the content item's j.2:creator property points to. -->
  <rdf:Description rdf:about="urn:uuid:d4011136-3aa6-4c8b-919d-0a3506c20c31">
    <j.2:fullname>Shawn Richard</j.2:fullname>
    <rdf:type
        rdf:resource="http://www.semanticdesktop.org/ontologies/2007/03/22/nco#Contact"/>
  </rdf:Description>
  <!-- The only enhancement in this result: a TextAnnotation created by the
       MetaxaEngine and extracted from the content item above. -->
  <rdf:Description
      rdf:about="urn:enhancement-7b92d553-3769-6136-4d37-5ceccdec0c7b">
    <j.4:confidence
        rdf:datatype="http://www.w3.org/2001/XMLSchema#double">1.0</j.4:confidence>
    <rdf:type
        rdf:resource="http://fise.iks-project.eu/ontology/TextAnnotation"/>
    <j.1:creator
        rdf:datatype="http://www.w3.org/2001/XMLSchema#string">org.apache.stanbol.enhancer.engines.metaxa.MetaxaEngine</j.1:creator>
    <j.1:created
        rdf:datatype="http://www.w3.org/2001/XMLSchema#dateTime">2012-01-14T17:52:19.327Z</j.1:created>
    <j.4:extracted-from
        rdf:resource="urn:content-item-sha1-f3e0ce27fa0eb5a69fec0c0dbaf90fcb456cdf55"/>
    <rdf:type rdf:resource="http://fise.iks-project.eu/ontology/Enhancement"/>
  </rdf:Description>
</rdf:RDF>

Reply via email to