Hi Ruben,
Thanks for reporting this, and sorry for the delay.
I've checked your website
against any23 v0.6.1 - the version currently used by the inspector to parse documents -
and also against the newest one, 0.8.0.
In both cases it failed to extract any triples from your page, with the same error:
java.lang.IllegalArgumentException: Invalid content ''
at org.apache.any23.extractor.microdata.ItemPropValue.<init>(ItemPropValue.java:89)
at org.apache.any23.extractor.microdata.MicrodataParser.getPropertyValue(MicrodataParser.java:341)
at org.apache.any23.extractor.microdata.MicrodataParser.getItemProps(MicrodataParser.java:394)
at org.apache.any23.extractor.microdata.MicrodataParser.getItemScope(MicrodataParser.java:471)
at org.apache.any23.extractor.microdata.MicrodataParser.getMicrodata(MicrodataParser.java:186)
at org.apache.any23.extractor.microdata.MicrodataParser.getMicrodata(MicrodataParser.java:203)
at org.apache.any23.extractor.microdata.MicrodataExtractor.run(MicrodataExtractor.java:100)
at org.apache.any23.extractor.microdata.MicrodataExtractor.run(MicrodataExtractor.java:62)
at org.apache.any23.extractor.SingleDocumentExtraction.runExtractor(SingleDocumentExtraction.java:477)
at org.apache.any23.extractor.SingleDocumentExtraction.run(SingleDocumentExtraction.java:260)
at org.apache.any23.Any23.extract(Any23.java:294)
at org.apache.any23.Any23.extract(Any23.java:446)
at org.apache.any23.servlet.WebResponder.runExtraction(WebResponder.java:113)
at org.apache.any23.servlet.Servlet.doPost(Servlet.java:108)
at javax.servlet.http.HttpServlet.service(HttpServlet.java:637)
at javax.servlet.http.HttpServlet.service(HttpServlet.java:717)
at org.apache.catalina.core.ApplicationFilterChain.internalDoFilter(ApplicationFilterChain.java:290)
at org.apache.catalina.core.ApplicationFilterChain.doFilter(ApplicationFilterChain.java:206)
at org.apache.catalina.core.StandardWrapperValve.invoke(StandardWrapperValve.java:233)
at org.apache.catalina.core.StandardContextValve.invoke(StandardContextValve.java:191)
at org.apache.catalina.core.StandardHostValve.invoke(StandardHostValve.java:127)
at com.googlecode.psiprobe.Tomcat60AgentValve.invoke(Tomcat60AgentValve.java:30)
at org.apache.catalina.valves.ErrorReportValve.invoke(ErrorReportValve.java:102)
at org.apache.catalina.core.StandardEngineValve.invoke(StandardEngineValve.java:109)
at org.apache.catalina.connector.CoyoteAdapter.service(CoyoteAdapter.java:293)
at org.apache.coyote.http11.Http11Processor.process(Http11Processor.java:859)
at org.apache.coyote.http11.Http11Protocol$Http11ConnectionHandler.process(Http11Protocol.java:602)
at org.apache.tomcat.util.net.JIoEndpoint$Worker.run(JIoEndpoint.java:489)
at java.lang.Thread.run(Thread.java:662)
With the newest version, 0.8.0:
2013-08-09 16:06:52,597 [qtp0-2] INFO c.s.i.s.RDFExtractorServlet - contentType:text/html
2013-08-09 16:06:52,597 [qtp0-2] INFO c.s.i.s.RDFExtractorServlet - contentEncoding:UTF-8
2013-08-09 16:06:52,625 [qtp0-2] INFO c.s.i.s.RdfextractorHTTPClient - Content-Type [text/html; charset=utf-8] header found in the response
2013-08-09 16:06:52,693 [qtp0-2] ERROR c.s.i.RDFExtractor - An error occurred extracting metadata using any23
java.lang.IllegalArgumentException: Invalid content ''
at org.apache.any23.extractor.microdata.ItemPropValue.<init>(ItemPropValue.java:89) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataParser.getPropertyValue(MicrodataParser.java:341) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataParser.getItemProps(MicrodataParser.java:394) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataParser.getItemScope(MicrodataParser.java:471) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataParser.getMicrodata(MicrodataParser.java:186) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataParser.getMicrodata(MicrodataParser.java:203) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataExtractor.run(MicrodataExtractor.java:89) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.microdata.MicrodataExtractor.run(MicrodataExtractor.java:58) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.SingleDocumentExtraction.runExtractor(SingleDocumentExtraction.java:471) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.extractor.SingleDocumentExtraction.run(SingleDocumentExtraction.java:254) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.Any23.extract(Any23.java:295) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.Any23.extract(Any23.java:447) [apache-any23-core-0.8.0.jar:0.8.0]
at org.apache.any23.Any23.extract(Any23.java:377) [apache-any23-core-0.8.0.jar:0.8.0]
at com.sindice.inspector.RDFExtractor.extract(RDFExtractor.java:187) [classes/:na]
at com.sindice.inspector.RDFExtractor.extract(RDFExtractor.java:152) [classes/:na]
at com.sindice.inspector.servlet.RDFExtractorServlet.doRDFExtract(RDFExtractorServlet.java:910) [classes/:na]
at com.sindice.inspector.servlet.RDFExtractorServlet.extractTriplesFromDocumentPart(RDFExtractorServlet.java:519) [classes/:na]
at com.sindice.inspector.servlet.RDFExtractorServlet.doRDFExtract(RDFExtractorServlet.java:374) [classes/:na]
at com.sindice.inspector.servlet.RDFExtractorServlet.doPost(RDFExtractorServlet.java:166) [classes/:na]
at javax.servlet.http.HttpServlet.service(HttpServlet.java:713) [servlet-api-3.0.pre4.jar:na]
at javax.servlet.http.HttpServlet.service(HttpServlet.java:806) [servlet-api-3.0.pre4.jar:na]
at org.mortbay.jetty.servlet.ServletHolder.handle(ServletHolder.java:502) [jetty-7.0.0.pre5.jar:7.0.0.pre5]
at org.mortbay.jetty.servlet.ServletHandler$CachedChain.doFilter(ServletHandler.java:1121) [jetty-7.0.0.pre5.jar:7.0.0.pre5]
at com.sindice.inspector.servlet.filter.SameIpBlocker.doFilter(SameIpBlocker.java:88) [classes/:na]
at org.mortbay.jetty.servlet.ServletHandler$CachedChain.doFilter(ServletHandler.java:1112) [jetty-7.0.0.pre5.jar:7.0.0.pre5]
at org.mortbay.jetty.servlet.ServletHandler.handle(ServletHandler.java:363) [jetty-7.0.0.pre5.jar:7.0.0.pre5]
at org.mortbay.jetty.security.ConstraintsSecurityHandler.handle(ConstraintsSecurityHandler.java:220) [jetty-security-7.0.0.pre5.jar:7.0.0.pre5]
at org.mortbay.jetty.servlet.SessionHandler.handle(SessionHandler.java:181) [jetty-7.0.0.pre5.jar:7.0.0.pre5]
There might be a good reason for this if you look at the validation results:
there are a couple of errors you might want to fix before trying again.
At the moment we are working on updating any23 to the newest version.
The new version of the inspector is expected next week.
If you think that your document is 100% valid, you might want to
notify the any23 team directly.
All the best,
Szymon