any23-commits mailing list archives

Site index · List index
Message view « Date » · « Thread »
Top « Date » · « Thread »
From ans...@apache.org
Subject svn commit: r1371537 [19/30] - in /incubator/any23/trunk: ./ core/ core/src/test/java/org/apache/any23/ core/src/test/java/org/apache/any23/cli/ core/src/test/java/org/apache/any23/extractor/ core/src/test/java/org/apache/any23/extractor/csv/ core/src/...
Date Fri, 10 Aug 2012 00:40:22 GMT
Added: incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rdfa-issue186-2.xhtml
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rdfa-issue186-2.xhtml?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rdfa-issue186-2.xhtml (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rdfa-issue186-2.xhtml Fri Aug 10 00:40:13 2012
@@ -0,0 +1,682 @@
+<?xml version="1.0" encoding="utf-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML+RDFa 1.0//EN" "http://www.w3.org/MarkUp/DTD/xhtml-rdfa-1.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en"
+      xmlns:foaf="http://xmlns.com/foaf/0.1/"
+      xmlns:owl="http://www.w3.org/2002/07/owl#"
+      xmlns:bio="http://purl.org/vocab/bio/0.1/"
+      xmlns:dbpedia="http://dbpedia.org/resource/"
+      xmlns:ov="http://open.vocab.org/terms/"
+      xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
+      xmlns:dc="http://purl.org/dc/terms/"
+      xmlns:v="http://www.w3.org/2006/vcard/ns#"
+      xmlns:swc="http://data.semanticweb.org/ns/swc/ontology#"
+      xmlns:swrc="http://swrc.ontoware.org/ontology#"
+        >
+<head>
+    <title property="dc:title">Richard Cyganiak's Homepage</title>
+    <base href="http://richard.cyganiak.de/"/>
+    <link rel="openid2.provider" href="https://open.login.yahooapis.com/openid/op/auth"/>
+    <link rel="openid2.local_id" href="https://me.yahoo.com/cygri"/>
+    <link rel="stylesheet" href="style.css" type="text/css"/>
+    <link rel="meta" href="foaf.rdf" type="application/rdf+xml"/>
+    <link rel="meta" href="foaf.n3" type="text/rdf+n3"/>
+    <link rel="foaf:primaryTopic foaf:maker" rev="foaf:homepage" href="#me"/>
+</head>
+
+<body about="#me" typeof="foaf:Person">
+
+<h1 property="foaf:name">Richard Cyganiak</h1>
+
+<div class="userpic" rel="foaf:img">
+    <img src="/2007/01/richard.jpg" alt="A photo of me"/>
+</div>
+
+<dl>
+    <dt>Mini bio:</dt>
+    <dd property="bio:olb" datatype="">Semantic Web evangelist. Researcher and engineer at <a
+            rel="foaf:workplaceHomepage" href="http://www.deri.ie/">DERI Galway</a>, Ireland. Berlin native.
+    </dd>
+
+    <dt>Interests:</dt>
+    <dd rel="foaf:topic_interest">
+        <span resource="[dbpedia:Semantic_Web]">Semantic Web</span>,
+        <span resource="[dbpedia:Linked_Data]">Linked Data</span>,
+        <span resource="[dbpedia:Resource_Description_Framework]">RDF</span>,
+        <span resource="[dbpedia:Data_integration]">data integration</span>,
+        <span resource="[dbpedia:Software_development]">software development</span>,
+        <span resource="[dbpedia:Go_(game)]">Go</span>,
+        <span resource="[dbpedia:Apple_Inc.]">Apple</span>
+    </dd>
+
+    <dt>Weblog:</dt>
+    <dd><a rel="foaf:weblog" href="http://dowhatimean.net/">dowhatimean.net</a></dd>
+
+    <dt>Email:</dt>
+    <dd><a rel="foaf:mbox" href="mailto:richard@cyganiak.de">richard@cyganiak.de</a></dd>
+
+    <dt>Skype:</dt>
+    <dd property="ov:skypeID">richard.cyganiak</dd>
+
+    <dt>Phone:</dt>
+    <dd rel="foaf:phone" resource="tel:+353-872206327">+353-87-2206327</dd>
+
+    <dt>IRC nick:</dt>
+    <dd property="foaf:nick">cygri</dd>
+
+    <dt>Home address:</dt>
+    <dd rel="v:homeAdr">
+  <span typeof="v:Address">
+    <span property="v:street-address">15 Greenfields Road</span>,
+    Newcastle,
+    <span property="v:locality">Galway</span>,
+    <span property="v:country-name">Ireland</span>
+    (<a rel="foaf:page"
+        href="http://maps.google.co.uk/maps/ms?ie=UTF8&amp;hl=en&amp;t=h&amp;msa=0&amp;ll=53.286554,-9.071601&amp;spn=0.001613,0.003256&amp;z=18&amp;msid=112557952290247281008.00045d9f04b3ad60a619f">Google
+      Maps</a>)
+  </span>
+    </dd>
+
+    <dt>Work address:</dt>
+    <dd rel="v:workAdr">
+  <span typeof="v:Address">
+    Office 102,
+    <span property="v:extended-address" datatype=""><a href="http://www.deri.ie/">Digital Enterprise Research
+        Institute</a>, NUI Galway</span>,
+    <span property="v:street-address">Lower Dangan</span>,
+    <span property="v:locality">Galway</span>,
+    <span property="v:country-name">Ireland</span>
+    (<a rel="foaf:page"
+        href="http://maps.google.co.uk/maps/ms?ie=UTF8&amp;hl=en&amp;t=h&amp;msa=0&amp;msid=112557952290247281008.00045d9f09460db317d5b&amp;ll=53.290065,-9.074053&amp;spn=0.003226,0.006512&amp;z=17">Google
+      Maps</a>)
+  </span>
+    </dd>
+
+    <dt>URI:</dt>
+    <dd><a rel="owl:sameAs"
+           href="http://richard.cyganiak.de/foaf.rdf#cygri">http://richard.cyganiak.de/foaf.rdf#cygri</a></dd>
+</dl>
+
+<h2>Web properties</h2>
+
+<ul>
+    <li><a rel="me foaf:weblog" href="http://dowhatimean.net/"><span property="rdfs:label">My weblog</span></a></li>
+    <li><img src="/images/foaf.png" alt=""/> <a rel="me rdfs:seeAlso" href="http://richard.cyganiak.de/foaf.rdf"><span
+            property="rdfs:label">My FOAF file</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://twitter.com/cygri"><span
+            property="rdfs:label">Me in Twitter</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://flickr.com/photos/cygri"><span
+            property="rdfs:label">Me in Flickr</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://www.facebook.com/people/Richard_Cyganiak/555777583"><span
+            property="rdfs:label">Me in Facebook</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://www.linkedin.com/in/cygri"><span
+            property="rdfs:label">Me in LinkedIn</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://delicious.com/cygri"><span
+            property="rdfs:label">Me in delicious</span></a></li>
+    <li><a rel="me foaf:holdsAccount" href="http://www.dopplr.com/traveller/cygri"><span property="rdfs:label">Me in Dopplr</span></a>
+    </li>
+    <li><a rel="me foaf:holdsAccount" href="http://www.last.fm/user/cygri"><span
+            property="rdfs:label">Me in last.fm</span></a></li>
+</ul>
+
+<h2>Current projects</h2>
+
+<dl rel="foaf:currentProject">
+    <dt about="#sindice"><a rel="foaf:homepage" property="foaf:name" href="http://sindice.com/">Sindice.com</a></dt>
+    <dd about="#sindice" property="rdfs:comment" datatype="">An experimental search engine for the Web of Data. The
+        project is led by <a href="http://g1o.net/">Giovanni Tummarello</a>. I joined in late 2007.
+    </dd>
+
+    <dt about="#d2rq"><a rel="foaf:homepage" property="foaf:name" href="http://d2rq.org/">D2RQ and D2R Server</a></dt>
+    <dd about="#d2rq" property="rdfs:comment" datatype="">An open-source project aimed at making relational databases
+        part of the Web of Data. Originally founded by <a href="http://bizer.de/">Chris Bizer</a>. I have maintained
+        D2RQ and D2R Server since 2005.
+    </dd>
+
+    <dt about="#neologism"><a rel="foaf:homepage" property="foaf:name" href="http://code.google.com/p/neologism/">Neologism</a>
+    </dt>
+    <dd about="#neologism" property="rdfs:comment">An open-source publishing platform for RDFS vocabularies. Currently
+        in Alpha stage. I founded this project in 2008.
+    </dd>
+
+    <dt about="#dbpedia"><a rel="foaf:homepage" property="foaf:name" href="http://dbpedia.org/">DBpedia</a></dt>
+    <dd about="#dbpedia" property="rdfs:comment">Extracting structured RDF information from Wikipedia. A large community
+        project involving several universities and companies. I have contributed to the original extraction framework
+        and have developed and maintained DBpedia's HTML frontend during much of 2007 and 2008.
+    </dd>
+
+    <dt about="#lod"><a rel="foaf:homepage" property="foaf:name"
+                        href="http://esw.w3.org/topic/SweoIG/TaskForces/CommunityProjects/LinkingOpenData">Linking Open
+        Data</a></dt>
+    <dd about="#lod" property="rdfs:comment" datatype="">A community effort to convert existing sources of open data to
+        RDF and make them part of the Semantic Web. I'm a co-founder of the project, together with <a
+                href="http://bizer.de/">Chris Bizer</a>. My main contribution is in helping to establish best practices
+        for publishing RDF on the Web, and maintaining the <a href="http://richard.cyganiak.de/2007/10/lod/">LOD dataset
+            cloud</a> diagram.
+    </dd>
+
+    <dt about="#semantic-sitemaps"><a rel="foaf:homepage" property="foaf:name"
+                                      href="http://sw.deri.org/2007/07/sitemapextension/">Semantic Sitemaps</a></dt>
+    <dd about="#semantic-sitemaps" property="rdfs:comment" datatype="">A proposed standard for improving RDF discovery,
+        originally designed by <a href="http://g1o.net/">Giovanni Tummarello</a>.
+    </dd>
+
+    <dt about="#void"><a rel="foaf:homepage" property="foaf:name" href="http://semanticweb.org/wiki/VoiD">voiD</a></dt>
+    <dd about="#void" property="rdfs:comment">A work-in-progress RDFS vocabulary for describing the contents of RDF
+        datasets.
+    </dd>
+
+    <dt about="#pubby"><a rel="foaf:homepage" property="foaf:name"
+                          href="http://www4.wiwiss.fu-berlin.de/pubby/">Pubby</a></dt>
+    <dd about="#pubby" property="rdfs:comment">A Linked Data server that exposes RDF data from SPARQL endpoints.
+        Originally developed for DBpedia.
+    </dd>
+
+    <dt about="#disco"><a rel="foaf:homepage" property="foaf:name"
+                          href="http://www4.wiwiss.fu-berlin.de/bizer/ng4j/disco/">Disco</a></dt>
+    <dd about="#disco" property="rdfs:comment">A simple RDF browser. Developed together with Tobias Gauß.</dd>
+
+    <dt>Miscellaneous</dt>
+    <dd>
+        <ul>
+            <li about="#accept-header-test">(03/2008) <a rel="foaf:homepage" property="foaf:name"
+                                                         href="http://dowhatimean.net/2008/03/what-is-your-rdf-browsers-accept-header">Accept
+                header test for RDF clients</a>: <span property="rdfs:comment">Small utility service to help implementers of content negotiation</span>
+            </li>
+            <li about="#foaf-geolocator">(03/2006) <a rel="foaf:homepage" property="foaf:name"
+                                                      href="http://dowhatimean.net/2006/03/adding-geo-cordinates-to-your-foaf-file">FOAF
+                geolocator</a>: <span property="rdfs:comment">Add geographic coordinates to your FOAF file</span></li>
+        </ul>
+    </dd>
+</dl>
+
+<h2>Past projects</h2>
+
+<dl rel="foaf:pastProject">
+    <dt about="#statcvs-statsvn"><a rel="foaf:homepage" property="foaf:name" href="http://statcvs.sourceforge.net/">StatCVS/StatSVN</a>
+    </dt>
+    <dd about="#statcvs-statsvn" property="rdfs:comment">StatCVS generates colorful reports from CVS repository logs. I
+        maintained the open-source project from 2002 to 2008. A port to Subversion, called StatSVN, was created by Jason
+        Kealey and Benoit Xhenseval. They took over maintenance of StatCVS in 2008.
+    </dd>
+
+    <dt about="#ng4j"><a rel="foaf:homepage" property="foaf:name" href="http://www4.wiwiss.fu-berlin.de/bizer/ng4j/">NG4J</a>
+    </dt>
+    <dd about="#ng4j" property="rdfs:comment" datatype="">NG4J provided support for <a
+            href="http://www.w3.org/2004/03/trix/">Named Graphs</a> long before this feature became standard in all RDF
+        stores. The project was initiated by Chris Bizer, and I maintained it throughout most of its lifetime.
+    </dd>
+
+    <dt about="#wiqa"><a rel="foaf:homepage" property="foaf:name"
+                         href="http://www4.wiwiss.fu-berlin.de/bizer/WIQA/index.htm">WIQA</a></dt>
+    <dd about="#wiqa" property="rdfs:comment" datatype="">A policy framework for Web Information Quality Assurance, part
+        of <a href="http://bizer.de/">Chris Bizer</a>'s doctoral thesis. I did parts of the implementation.
+    </dd>
+
+    <dt><a rel="rdfs:seeAlso" href="2008/12/old-stuff.html#projekte">Old stuff</a></dt>
+    <dd>Some very old projects. Page in German.</dd>
+</dl>
+
+<h2>Publications</h2>
+
+<p>I occasionally blog at <a href="http://dowhatimean.net/">dowhatimean.net</a>.</p>
+
+<p>There is a <a href="2008/12/old-stuff.html#dokumente">list of my very old publications</a> (page in German). Once
+    upon a time, I did some blogging in German <a href="/blog/">here</a>.</p>
+
+<h3>Tutorials and HOWTOs</h3>
+
+<dl rev="dc:creator">
+    <dt>
+        <a href="http://videolectures.net/iswc08_heath_hpldw/"><span property="dc:title">How to Publish Linked Data on the Web</span></a>
+        (Video, ISWC 2008)
+    </dt>
+    <dd>
+        Tom Heath, Michael Hausenblas, Christian Bizer, Richard Cyganiak, Olaf Hartig.
+        Tutorial at ISWC 2008, Karlsruhe.
+        Published at videolectures.net.
+    </dd>
+
+    <dt>
+        <a href="http://www4.wiwiss.fu-berlin.de/bizer/pub/LinkedDataTutorial/"><span property="dc:title">How to Publish Linked Data on the Web</span></a>
+    </dt>
+    <dd>
+        Christian Bizer, Richard Cyganiak, Tom Heath.
+        Tutorial, 2007.
+    </dd>
+
+    <dt>
+        <a href="http://www.w3.org/TR/cooluris/"><span property="dc:title">Cool URIs for the Semantic Web</span></a>
+    </dt>
+    <dd>
+        Leo Sauermann, Richard Cyganiak, Danny Ayers, Max Völkel.
+        W3C Interest Group Note, 2008.
+    </dd>
+
+    <dt>
+        <a href="http://dowhatimean.net/2007/02/debugging-semantic-web-sites-with-curl"><span property="dc:title">Debugging Semantic Web sites with cURL</span></a>
+    </dt>
+    <dd>
+        Tutorial, 2007.
+    </dd>
+</dl>
+
+
+<h3>Peer-reviewed</h3>
+
+<dl class="academic-publications" rev="dc:creator">
+    <dt>
+        Quality-Driven Information Filtering Using the WIQA Policy Framework
+        (JWS, 2008)
+    </dt>
+    <dd typeof="swrc:Article">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <a property="dc:title" rel="swrc:url"
+           href="http://www.sciencedirect.com/science?_ob=ArticleURL&amp;_udi=B758F-4SB9DY9-1&amp;_user=103680&amp;_rdoc=1&amp;_fmt=&amp;_orig=search&amp;_sort=d&amp;view=c&amp;_acct=C000007922&amp;_version=1&amp;_urlVersion=0&amp;_userid=103680&amp;md5=5365a5bc668dadd8c82293401193d3d1">Quality-Driven
+            Information Filtering Using the WIQA Policy Framework</a> (Article in Press).
+        <span property="swrc:journal">Journal of Web Semantics: Science, Services and Agents on the World Wide Web</span>,
+        <span property="swrc:year">2008</span>.
+    </dd>
+
+    <dt>
+        Neologism – Easy Vocabulary Publishing
+        (SFSW2008)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:cosmin_basca]"><span property="foaf:name">Cosmin Basca</span></span>,
+        <span rel="swrc:author" resource="[_:stephane_corlosquet]"><span property="foaf:name">Stéphane Corlosquet</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:sergio_fernandez]"><span
+                property="foaf:name">Sergio Fernández</span></span>,
+        <span rel="swrc:author" resource="[_:thomas_schandl]"><span property="foaf:name">Thomas Schandl</span></span>:
+        <span property="dc:title">Neologism – Easy Vocabulary Publishing</span>.
+        <span property="ov:presentedAt">4th Workshop on Scripting for the Semantic Web, Tenerife, Spain</span>,
+        <span property="swrc:month">June</span> <span property="swrc:year">2008</span>.
+        (<a rel="swrc:url" href="/2008/papers/neologism-sfsw2008.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        Semantic Sitemaps – Efficient and Flexible Access to Datasets on the Semantic Web
+        (ESWC2008)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:holger_stenzhorn]"><span
+                property="foaf:name">Holger Stenzhorn</span></span>,
+        <span rel="swrc:author" resource="[_:renaud_delbru]"><span property="foaf:name">Renaud Delbru</span></span>,
+        <span rel="swrc:author" resource="[_:stefan_decker]"><span property="foaf:name">Stefan Decker</span></span>,
+        <span rel="swrc:author" resource="[_:giovanni_tummarello]"><span property="foaf:name">Giovanni Tummarello</span></span>:
+        <span property="dc:title">Semantic Sitemaps – Efficient and Flexible Access to Datasets on the Semantic Web</span>.
+        <span property="ov:presentedAd">5th European Semantic Web Conference, Tenerife, Spain</span>,
+        <span property="swrc:month">June</span> <span property="swrc:year">2008</span>.
+        (<a rel="swrc:url" href="/2008/papers/sitemaps-eswc2008.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        Browsing Linked Data with Fenfire
+        (Demo at LDOW2008)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:tuukka_hastrup]"><span property="foaf:name">Tuukka Hastrup</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:uldis_bojars]"><span property="foaf:name">Uldis Bojārs</span></span>:
+        <span property="dc:title">Browsing Linked Data with Fenfire (Demo)</span>.
+        <span property="ov:presentedAd">Workshop on Linked Data on the Web (LDOW2008), Beijing, China</span>,
+        <span property="swrc:month">April</span> <span property="swrc:year">2008</span>.
+        (<a rel="swrc:url" href="/2008/papers/fenfire-ldow2008.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        Weaving SIOC into the Web of Linked Data
+        (LDOW2008)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:uldis_bojars]"><span property="foaf:name">Uldis Bojārs</span></span>,
+        <span rel="swrc:author" resource="[_:alexandre_passant]"><span
+                property="foaf:name">Alexandre Passant</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:john_breslin]"><span property="foaf:name">John Breslin</span></span>:
+        <span property="dc:title">Weaving SIOC into the Web of Linked Data</span>.
+        <span property="ov:presentedAd">Workshop on Linked Data on the Web (LDOW2008), Beijing, China</span>,
+        <span property="swrc:month">April</span> <span property="swrc:year">2008</span>.
+        (<a rel="swrc:url" href="/2008/papers/sioc-ldow2008.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        Sindice.com – A Document-oriented Lookup Index for Open Linked Data
+        (IJMSO, 2008)
+    </dt>
+    <dd typeof="swrc:Article">
+        <span rel="swrc:author" resource="[_:eyal_oren]"><span property="foaf:name">Eyal Oren,</span></span>
+        <span rel="swrc:author" resource="[_:renaud_delbru]"><span property="foaf:name">Renaud Delbru,</span></span>
+        <span rel="swrc:author" resource="[_:michele_catasta]"><span property="foaf:name">Michele Catasta,</span></span>
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak,</span></span>
+        <span rel="swrc:author" resource="[_:holger_stenzhorn]"><span
+                property="foaf:name">Holger Stenzhorn,</span></span>
+        <span rel="swrc:author" resource="[_:giovanni_tummarello]"><span property="foaf:name">Giovanni Tummarello</span></span>:
+        <span property="dc:title">Sindice.com – A Document-oriented Lookup Index for Open Linked Data</span>.
+        <span property="swrc:journal">International Journal of Metadata, Semantics and Ontologies, 3 (1)</span>,
+        <span property="swrc:year">2008</span>.
+        (<a rel="swrc:url" href="/2008/papers/sindice-ijmso2008.pdf">PDF</a>)
+    </dd>
+</dl>
+
+<h4>2007</h4>
+
+<dl class="academic-publications" rev="dc:creator">
+    <dt>
+        DBpedia – A Nucleus for a Web of Open Data
+        (ISWC2007)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:soren_auer]"><span property="foaf:name">Sören Auer</span></span>,
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="[_:georgi_kobilarov]"><span
+                property="foaf:name">Georgi Kobilarov</span></span>,
+        <span rel="swrc:author" resource="[_:jens_lehmann]"><span property="foaf:name">Jens Lehmann</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:zachary_ives]"><span property="foaf:name">Zachary Ives</span></span>:
+        <span property="dc:title">DBpedia – A Nucleus for a Web of Open Data</span>.
+        <span property="ov:presentedAd">6th International Semantic Web Conference (ISWC 2007), Busan, Korea</span>,
+        <span property="swrc:month">November</span> <span property="swrc:year">2007</span>.
+        (<a rel="swrc:url" href="/2008/papers/dbpedia-iswc2007.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        D2RQ – Lessons Learned
+        (W3C RdfRDB 2007)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:chrisitan_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>:
+        <a property="dc:title" rel="swrc:url" href="http://www.w3.org/2007/03/RdfRDB/papers/d2rq-positionpaper/">D2RQ –
+            Lessons Learned</a>.
+        <span property="ov:presentedAd">W3C Workshop on RDF Access to Relational Databases, Boston, USA</span>,
+        <span property="swrc:month">October</span> <span property="swrc:year">2007</span>
+    </dd>
+
+    <dt>
+        DBpedia – A Nucleus for a Web of Open Data
+        (Poster at CSSW2007)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>:
+        <span property="dc:title">DBpedia – A Nucleus for a Web of Open Data (Poster)</span>.
+        <span property="ov:presentedAd">SABRE Conference on Social Semantic Web (CSSW 2007), Leipzig, Germany</span>,
+        <span property="swrc:month">September</span> <span property="swrc:year">2007</span>.
+        (<a href="/2008/posters/dbpedia-cssw2007.pdf">Poster</a>)
+    </dd>
+
+    <dt>
+        RDF Book Mashup – From Web APIs to a Web of Data
+        (SFSW2007)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:tobias_gauss]"><span property="foaf:name">Tobias Gauß</span></span>:
+        <span property="dc:title">The RDF Book Mashup – From Web APIs to a Web of Data</span>.
+        <span property="ov:presentedAd">3rd Workshop on Scripting for the Semantic Web (SFSW2007), Innsbruck, Austria</span>,
+        <span property="swrc:month">June</span> <span property="swrc:year">2007</span>
+        (<a rel="swrc:url" href="/2008/papers/bookmashup-sfsw2007.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        DBpedia – Querying Wikipedia like a Database
+        (Dev Track at WWW2007)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="[_:soren_auer]"><span property="foaf:name">Sören Auer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:georgi_kobilarov]"><span
+                property="foaf:name">Georgi Kobilarov</span></span>:
+        <span property="dc:title">DBpedia – Querying Wikipedia like a Database</span>.
+        <span property="ov:presentedAd">16th International World Wide Web Conference (WWW2007), Banff, Canada</span>,
+        <span property="swrc:month">May</span> <span property="swrc:year">2007</span>.
+    </dd>
+</dl>
+
+<h4>2006</h4>
+
+<dl class="academic-publications" rev="dc:creator">
+    <dt>
+        D2R Server – A Semantic Web Front-end to Existing Relational Databases
+        (Poster at BXMLT2006)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>:
+        <span property="dc:title">D2R Server – A Semantic Web Front-end to Existing Relational Databases (Poster)</span>.
+        <span property="ov:presentedAd">Berliner XML Tage, Berlin, Germany</span>,
+        <span property="swrc:month">September</span> <span property="swrc:year">2006</span>.
+        (<a rel="swrc:url" href="/2008/papers/d2r-server-bxmlt2006.pdf">PDF</a>)
+        (<a href="/2008/posters/d2r-server-bxmlt2006.pdf">Poster</a>)
+    </dd>
+
+    <dt>
+        DODA 0.1 – An Ontology for Lightweight Integration of Semantic Data Access Technologies
+        (SIIK2006)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:giovanni_tummarello]"><span property="foaf:name">Giovanni Tummarello</span></span>,
+        <span rel="swrc:author" resource="[_:christian_morbidoni]"><span property="foaf:name">Christian Morbidoni</span></span>,
+        <span rel="swrc:author" resource="[_:michele_nucci]"><span property="foaf:name">Michele Nucci</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>:
+        <span property="dc:title">DODA 0.1 – An Ontology for Lightweight Integration of Semantic Data Access Technologies</span>.
+        <span property="ov:presentedAd">1st International Workshop on Semantic Information Integration on Knowledge Discovery (SIIK 2006), Yogyakarta, Indonesia</span>,
+        <span property="swrc:month">December</span> <span property="swrc:year">2006</span>.
+        (<a rel="swrc:url" href="/2008/papers/doda-siik2006.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        The DODA Ontology – Lightweight Integration of Semantic Data Access Technologies
+        (SWAP2006)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_morbidoni]"><span property="foaf:name">Christian Morbidoni</span></span>,
+        <span rel="swrc:author" resource="[_:giovanni_tummarello]"><span property="foaf:name">Giovanni Tummarello</span></span>,
+        <span rel="swrc:author" resource="[_:michele_nucci]"><span property="foaf:name">Michele Nucci</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>:
+        <span property="dc:title">The DODA Ontology – Lightweight Integration of Semantic Data Access Technologies</span>.
+        <span property="ov:presentedAd">3rd Italian Semantic Web Workshop (SWAP 2006), Pisa, Italy</span>,
+        <span property="swrc:month">December</span> <span property="swrc:year">2006</span>.
+        (<a rel="swrc:url" href="/2008/papers/doda-swap2006.pdf">PDF</a>)
+    </dd>
+
+    <dt>
+        D2R Server – Publishing Relational Databases on the Semantic Web
+        (Poster at ISWC2006)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>:
+        <span property="dc:title">D2R Server – Publishing Relational Databases on the Semantic Web (Poster)</span>.
+        <span property="ov:presentedAd">5th International Semantic Web Conference, Athens, USA</span>,
+        <span property="swrc:month">November</span> <span property="swrc:year">2006</span>.
+        (<a rel="swrc:url" href="/2008/papers/d2r-server-iswc2006.pdf">PDF</a>)
+        (<a href="/2008/posters/d2r-server-iswc2006.pdf">Poster</a>)
+    </dd>
+
+    <dt>
+        D2R Server – Publishing Relational Databases on the Web as SPARQL Endpoints
+        (Dev Track at WWW2006)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>:
+        <span property="dc:title">D2R Server – Publishing Relational Databases on the Web as SPARQL Endpoints</span>.
+        <span property="ov:presentedAd">15th International World Wide Web Conference (WWW2006), Edinburgh, Scotland</span>,
+        <span property="swrc:month">May</span> <span property="swrc:year">2006</span>.
+    </dd>
+</dl>
+
+<h4>2005</h4>
+
+<dl class="academic-publications" rev="dc:creator">
+    <dt>
+        The TriQL.P Browser – Filtering Information using Context-, Content- and Rating-Based Trust Policies
+        (SWPW2005)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:tobias_gauss]"><span property="foaf:name">Tobias Gauß</span></span>,
+        <span rel="swrc:author" resource="[_:and_oliver_maresch]"><span
+                property="foaf:name">and Oliver Maresch</span></span>:
+        <span property="dc:title">The TriQL.P Browser – Filtering Information using Context-, Content- and Rating-Based Trust Policies</span>.
+        <span property="ov:presentedAd">Semantic Web and Policy Workshop at the 4th International Semantic Web Conference, Galway, Ireland</span>,
+        <span property="swrc:month">November</span> <span property="swrc:year">2005</span>.
+        (<a rel="swrc:url" href="/2008/papers/triqlp-swpw2005.pdf">PDF</a>)
+    </dd>
+
+    <dt>NG4J – Named Graphs API for Jena
+        (Poster, ESWC2005)
+    </dt>
+    <dd typeof="swrc:InProceedings">
+        <span rel="swrc:author" resource="[_:christian_bizer]"><span property="foaf:name">Christian Bizer</span></span>,
+        <span rel="swrc:author" resource="#me"><span property="foaf:name">Richard Cyganiak</span></span>,
+        <span rel="swrc:author" resource="[_:rowland_watkins]"><span property="foaf:name">Rowland Watkins</span></span>:
+        <span property="dc:title">NG4J – Named Graphs API for Jena (Poster)</span>.
+        <span property="ov:presentedAd">2nd European Semantic Web Conference (ESWC 2005), Heraklion, Greece</span>,
+        <span property="swrc:month">May</span> <span property="swrc:year">2005</span>.
+        (<a rel="swrc:url" href="/2008/papers/ng4j-eswc2005.pdf">PDF</a>)
+        (<a href="/2008/posters/ng4j-eswc2005.pdf">Poster</a>)
+    </dd>
+</dl>
+
+
+<h2>Talks and slides</h2>
+
+<p>@@@ Some day I will upload all my presentations to SlideShare. For now, just some notes.</p>
+
+<ul>
+    <li>See publication list above</li>
+    <li>Linked Data in 7 Easy Steps, Tutorial, ISWC2008</li>
+    <li>Using the Web of Data, WOD-PD 2008</li>
+    <li>There's more than US-ASCII, lightning talk at ESWC2008</li>
+    <li>Sindice.com, lightning talk at LOD Gathering, ESWC2008</li>
+    <li>Sindice.com, Linked Data Planet, 2008</li>
+    <li>Web of Data, XTech 2008</li>
+    <li>Linking Open Data, New York Semantic Web Meetup, 2008</li>
+    <li>D2RQ, W3C RDF2RDB XG, 2008</li>
+    <li>Semantics and Complexity of SPARQL, DERI Reading Group, 2007</li>
+    <li>D2R Server, JUC 2006</li>
+    <li>D2RQ, HP Labs, 2005</li>
+</ul>
+
+
+<h2>Posters</h2>
+
+<p>All of these are made with <a href="http://www.omnigroup.com/applications/OmniGraffle/">OmniGraffle</a>. On some, I
+    have contributed not as an author but only by creating the poster itself.</p>
+
+<p class="posters">
+    <a href="/2008/posters/dbpedia-cssw2007.pdf"><img src="/2008/posters/dbpedia-cssw2007.png"
+                                                      title="DBpedia – A Nucleus for the Web of Open Data (CSSW2007)"
+                                                      alt="Poster thumbnail"/></a>
+    <a href="/2008/posters/lod-eswc2007.pdf"><img src="/2008/posters/lod-eswc2007.png"
+                                                  title="Linking Open Data (ESWC2007)" alt="Poster thumbnail"/></a>
+    <a href="/2008/posters/d2r-server-bxmlt2006.pdf"><img src="/2008/posters/d2r-server-bxmlt2006.png"
+                                                          title="D2R Server – A Semantic Web Front-end to Existing Relational Databases (BXMLT2006)"
+                                                          alt="Poster thumbnail"/></a>
+    <a href="/2008/posters/d2r-server-iswc2006.pdf"><img src="/2008/posters/d2r-server-iswc2006.png"
+                                                         title="D2R Server – Publishing Relational Databases on the Web (ISWC2006)"
+                                                         alt="Poster thumbnail"/></a>
+    <a href="/2008/posters/ng4j-eswc2005.pdf"><img src="/2008/posters/ng4j-eswc2005.png"
+                                                   title="NG4J – Named Graphs API for Jena (ESWC2005)"
+                                                   alt="Poster thumbnail"/></a>
+    <a href="/2008/posters/d2rq-iswc2004.pdf"><img src="/2008/posters/d2rq-iswc2004.png"
+                                                   title="D2RQ – Treating Non-RDF Databases as Virtual RDF Graphs (ISWC2004)"
+                                                   alt="Poster thumbnail"/></a>
+</p>
+
+
+<h2>Event organizer</h2>
+
+<ul rel="swc:holdsRole">
+    <li typeof="swc:MetadataChair">Metadata co-chair, <span rel="swc:isRoleAt"
+                                                            resource="http://data.semanticweb.org/conference/iswc/2009"><a
+            property="rdfs:label" rel="foaf:homepage" href="http://iswc2009.semanticweb.org/">International Semantic Web
+        Conference 2009</a> (ISWC2009)</span></li>
+    <li typeof="swc:WorkshopOrganiser">Co-organizer, <span rel="swc:isRoleAt"><a property="rdfs:label"
+                                                                                 rel="foaf:homepage"
+                                                                                 href="http://vocamp.org/wiki/VoCampOxford2008">VoCamp
+        Oxford 2008</a></span></li>
+    <li typeof="swc:WorkshopOrganiser">Co-organizer, <span rel="swc:isRoleAt"><a property="rdfs:label"
+                                                                                 rel="foaf:homepage"
+                                                                                 href="http://vocamp.org/wiki/VoCampGalway2008">VoCamp
+        Galway 2008</a></span></li>
+    <li typeof="swc:MetadataChair">Metadata co-chair, <span rel="swc:isRoleAt"
+                                                            resource="http://data.semanticweb.org/conference/iswc/2008"><a
+            property="rdfs:label" rel="foaf:homepage" href="http://iswc2008.semanticweb.org/">International Semantic Web
+        Conference 2008</a> (ISWC2008)</span></li>
+    <li typeof="swc:WorkshopOrganiser">Co-organizer, <span rel="swc:isRoleAt"><a property="rdfs:label"
+                                                                                 rel="foaf:homepage"
+                                                                                 href="http://www.semanticdesktop.org/xwiki/bin/view/Wiki/SemDeskHandsOn2007April">Semantic
+        Desktop Hands-on Workshop 2007</a></span></li>
+</ul>
+
+
+<h2>PC memberships</h2>
+
+<ul rel="swc:holdsRole">
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://events.linkeddata.org/ldow2009/">Linked
+        Data on the Web</a> (LDOW2009)</span></li>
+    <li typeof="swc:PCMember">Conference: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                      href="http://i-semantics.tugraz.at/conference">I-Semantics
+        2009</a></span></li>
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://sdow2008.semanticweb.org/">Social Data
+        on the Web</a> (SDoW2008)</span></li>
+    <li typeof="swc:PCMember">Conference: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                      href="http://i-know.tugraz.at/previous_conferences/i_semantics_08">I-Semantics
+        2008</a></span></li>
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://events.linkeddata.org/ldow2008/">Linked
+        Data on the Web</a> (LDOW2008)</span></li>
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://www.semanticscripting.org/SFSW2008/">4th
+        Workshop on Scripting for the Semantic Web</a> (SFSW2008)</span></li>
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://www.okkam.org/IRSW2008">Identity and
+        Reference on the Semantic Web</a> (IRSW2008)</span></li>
+    <li typeof="swc:PCMember">Conference: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                      href="http://aksw.org/SocialSemanticWebConference">SABRE
+        Conference on Social Semantic Web</a> (CSSW2007)</span></li>
+    <li typeof="swc:PCMember">Workshop: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                    href="http://www.semanticscripting.org/SFSW2007/">3rd
+        Workshop on Scripting for the Semantic Web</a> (SFSW2007)</span></li>
+    <li typeof="swc:PCMember">Conference: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                      href="http://www.hpl.hp.com/conferences/juc2007/">Jena
+        User Conference 2007</a> (JUC2007)</span></li>
+    <li typeof="swc:PCMember">Conference: <span rel="swc:isRoleAt"><a property="rdfs:label" rel="foaf:homepage"
+                                                                      href="http://jena.hpl.hp.com/juc2006/">Jena User
+        Conference 2006</a> (JUC2006)</span></li>
+</ul>
+
+<h2>Data</h2>
+
+<p><a href="http://www.w3.org/2007/08/pyRdfa/extract?uri=http%3A%2F%2Frichard.cyganiak.de%2F"><img
+        src="images/sw-rdfa-orange.png" alt="[RDFa logo]" title="RDFa data extracted from this homepage"/></a></p>
+
+</body>
+</html>

Added: incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-href.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-href.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-href.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-href.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,25 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head></head>
+<body>
+<div prefix="foaf:http://xmlns.com/foaf/0.1/" about="#me">
+   My name is <span property="foaf:name">John Doe</span> and my blog is called
+   <a rel="foaf:homepage" href="http://example.org/blog/">Understanding Semantics</a>.
+</div>
+</body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-rev.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-rev.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-rev.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/rel-rev.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,29 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head></head>
+<body>
+As Gandalf the White said in
+<span rel="cite" resource="http://www.example.com/books/the_two_towers">
+    The Two Towers
+</span>,
+<quote xml:lang="en">"The hospitality of
+    your hall is somewhat lessened of late, Theoden King."
+</quote>
+<span rev="isChapterOf"><a href="http://path/to/chapter">Read the chapter</a></span>
+</body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/vocab.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/vocab.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/vocab.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/vocab.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,25 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head></head>
+<body>
+<div vocab="http://xmlns.com/foaf/0.1/" about="#me">
+   My name is <span property="name">John Doe</span> and my blog is called
+   <a rel="homepage" href="http://example.org/blog/">Understanding Semantics</a>.
+</div>
+</body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/xmlliteral-datatype-test.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/xmlliteral-datatype-test.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/xmlliteral-datatype-test.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rdfa/xmlliteral-datatype-test.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,33 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML+RDFa 1.0//EN"
+  "http://www.w3.org/MarkUp/DTD/xhtml-rdfa-1.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" version="XHTML+RDFa 1.0" dir="ltr"
+  xmlns:foaf="http://xmlns.com/foaf/0.1/"
+  xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
+  xmlns:rdfs="http://www.w3.org/2000/01/rdf-schema#"
+  xmlns:xsd="http://www.w3.org/2001/XMLSchema#">
+
+<head></head>
+<body>
+<p>You searched for <strong>Einstein</strong>:</p>
+<p about="http://dbpedia.org/resource/Albert_Einstein">
+  <span property="foaf:name" datatype="rdf:XMLLiteral">Albert <strong>Einstein</strong></span>
+  (b. March 14, 1879, d. April 18, 1955) was a German-born theoretical physicist.
+</p>
+</body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/html/rff-test.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/html/rff-test.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/html/rff-test.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/html/rff-test.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,130 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html 
+  xmlns:contact="http://www.w3.org/2001/vcard-rdf/3.0#">
+  <head>
+<meta name="ICBM" content="45.12345, 45.65432"/>
+<meta name="geo.position" content="23.32;-23.32">
+<!-- stuff that should be ignored -->
+<link rel="stylesheet" type="text/css" media="print" href="/jira/s/300/1/_/styles/combined-printable.css">
+<link type="text/css" rel="StyleSheet" media="all" href="/jira/s/300/1/_/styles/combined.css"/>
+<link type="text/css" rel="StyleSheet" media="all" href="/jira/s/300/1/24/_/styles/global.css"/>
+    <title> Kewl title </title>
+  </head>
+  <body>
+
+    <a href="http://foo.com" rel="nofollow">crap </a>
+
+    <a href="http://bob.com" rel="me">my other blog </a>
+    <div>
+
+      <!-- stuff for pseudo rdfa -->
+      <div>
+        <p class="contactinfo" about="http://rdfa-user.org/staff/jo">
+        <span property="contact:fn">Jo Smith</span>.
+        <span property="contact:title">RDFa Professional</span>
+        at
+        <a rel="contact:org" href="http://example.org">
+          Example.org
+        </a>.
+        You can contact me
+        <a rel="contact:email" href="mailto:jo@example.org">
+          via email
+        </a>.
+        </p>
+      </div>
+      <div class="vcard">
+        <div style="text-align: center">
+          <object data="http://www.enterprise-component.com/images/datlogo.gif" class="logo">
+            <span class="org">Data Access Technologies</span>
+          </object><br />
+          <b class="fn n">
+            <span class="given-name">Cory</span
+              > <span class="additional-name">B.</span
+                > <span class="family-name">Casanave</span
+                  ></b>
+                <div class="title">President &amp; CEO</div>
+              </div>
+
+              <hr />
+              <table width="100%">
+                <tr>
+                  <td class="adr">
+                  </span>
+                  <div class="street-address">8605 Westwood Center Drive</div>
+                  <div class="extended-address">Suite 505</div>
+                  <span class="locality">Vienna</span>, 
+                  <span class="region">VA</span>, 
+                  <span class="postal-code">22182</span>
+                  <div class="country-name">USA</div>
+                </td>
+
+                <td style="text-align: right">
+                  <div class="tel">Phone: <span class="value">+1-123-456-7890</span></div>
+                  <div class="tel"><abbr class="type" title="cell">Mobile</abbr>: <span class="value">+1-111-555-7890</span></div>
+                  <div class="tel"><abbr class="type" title="fax">Fax</abbr>: <span class="value">+1-111-111-1234</span></div>
+
+                  <a class="email" href="mailto:cory@example">cory@example</a>
+                </td>
+              </tr>
+            </table>
+
+            <hr />
+
+            <p style="font-size:smaller;">This is an <a href="http://microformats.org/wiki/hcard">hCard</a>; the data come from a business card that Cory gave to Dan Connolly at ISWC; the email address and phone numbers have been scrubbed, but
+            the other data is published in a <a href="http://www.enterprise-component.com/company.shtml">company info page</a> so we figure it's OK to use it here.</p>
+            <p>Note the use of the <a href="http://www.w3.org/2006/03/hcard">http://www.w3.org/2006/03/hcard</a> profile, which may become obsolete soon.</p>
+          </div>
+
+
+          <div class="hreview">
+            <span><span class="rating">5</span> out of 5 stars</span>
+
+            <h4 class="summary">Crepes on Cole is awesome</h4>
+
+            <span class="reviewer vcard">Reviewer: 
+              <span class="fn">Tantek</span> - 
+              <abbr class="dtreviewed" title="20050418T2300-0700">April 18, 2005</abbr>
+            </span>
+            <div class="description item vcard">
+              <p>
+              <span class="fn org">Crepes on Cole</span> is one of the best little 
+              creperies in <span class="adr"><span class="locality">San Francisco</span></span>.
+              Excellent food and service. Plenty of tables in a variety of sizes 
+              for parties large and small.  Window seating makes for excellent 
+              people watching to/from the N-Judah which stops right outside.  
+              I've had many fun social gatherings here, as well as gotten 
+              plenty of work done thanks to neighborhood WiFi.
+              </p>
+            </div>
+            <p>Visit date: <span>April 2005</span></p>
+            <p>Food eaten: <span>Florentine crepe</span></p>
+          </div>
+
+          <!-- merry hcalendar -->
+          <div>
+
+            <div class="vevent">
+              <a class="url" href="http://www.web2con.com/">http://www.web2con.com/</a>
+              <span class="summary">Web 2.0 Conference</span>: 
+              <abbr class="dtstart" title="2007-10-05">October 5</abbr>-
+              <abbr class="dtend" title="2007-10-20">19</abbr>,
+              at the <span class="location">Argent Hotel, San Francisco, CA</span>
+            </div>
+          </div>
+        </body>
+      </html>

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1-expected.nquads
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1-expected.nquads?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1-expected.nquads (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1-expected.nquads Fri Aug 10 00:40:13 2012
@@ -0,0 +1,27 @@
+#
+#  Licensed to the Apache Software Foundation (ASF) under one or more
+#  contributor license agreements.  See the NOTICE file distributed with
+#  this work for additional information regarding copyright ownership.
+#  The ASF licenses this file to You under the Apache License, Version 2.0
+#  (the "License"); you may not use this file except in compliance with
+#  the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+#
+
+<http://books.example.com/works/45U8QJGZSQKDH8N> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <http://purl.org/vocab/frbr/core#Work> <http://bob.example.com/> .
+<http://books.example.com/works/45U8QJGZSQKDH8N> <http://purl.org/dc/elements/1.1/creator> "Wil Wheaton" <http://bob.example.com/> .
+<http://books.example.com/works/45U8QJGZSQKDH8N> <http://purl.org/dc/terms/title> "Just a Geek" <http://bob.example.com/> .
+<http://books.example.com/works/45U8QJGZSQKDH8N> <http://purl.org/vocab/frbr/core#realization> <http://books.example.com/products/9780596007683.BOOK> <http://bob.example.com/> .
+<http://books.example.com/works/45U8QJGZSQKDH8N> <http://purl.org/vocab/frbr/core#realization> <http://books.example.com/products/9780596802189.EBOOK> <http://bob.example.com/> .
+<http://books.example.com/products/9780596007683.BOOK> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <http://purl.org/vocab/frbr/core#Expression> <http://bob.example.com/> .
+<http://books.example.com/products/9780596007683.BOOK> <http://purl.org/dc/terms/type> <http://books.example.com/product-types/BOOK> <http://bob.example.com/> .
+<http://books.example.com/products/9780596802189.EBOOK> <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <http://purl.org/vocab/frbr/core#Expression> <http://bob.example.com/> .
+<http://books.example.com/products/9780596802189.EBOOK> <http://purl.org/dc/terms/type> <http://books.example.com/product-types/EBOOK> <http://bob.example.com/> .
+<http://bob.example.com/> <http://www.w3.org/1999/xhtml/microdata#item> <http://books.example.com/works/45U8QJGZSQKDH8N> <http://bob.example.com/> .
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-1.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,39 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<dl itemscope
+    itemtype="http://purl.org/vocab/frbr/core#Work"
+    itemid="http://books.example.com/works/45U8QJGZSQKDH8N">
+    <dt>Title</dt>
+    <dd><cite itemprop="http://purl.org/dc/terms/title">Just a Geek</cite></dd>
+    <dt>By</dt>
+    <dd><span itemprop="http://purl.org/dc/elements/1.1/creator">Wil Wheaton</span></dd>
+    <dt>Format</dt>
+    <dd itemprop="http://purl.org/vocab/frbr/core#realization"
+        itemscope
+        itemtype="http://purl.org/vocab/frbr/core#Expression"
+        itemid="http://books.example.com/products/9780596007683.BOOK">
+        <link itemprop="http://purl.org/dc/terms/type" href="http://books.example.com/product-types/BOOK">
+        Print
+    </dd>
+    <dd itemprop="http://purl.org/vocab/frbr/core#realization"
+        itemscope
+        itemtype="http://purl.org/vocab/frbr/core#Expression"
+        itemid="http://books.example.com/products/9780596802189.EBOOK">
+        <link itemprop="http://purl.org/dc/terms/type" href="http://books.example.com/product-types/EBOOK">
+        Ebook
+    </dd>
+</dl>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2-expected.nquads
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2-expected.nquads?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2-expected.nquads (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2-expected.nquads Fri Aug 10 00:40:13 2012
@@ -0,0 +1,32 @@
+#
+#  Licensed to the Apache Software Foundation (ASF) under one or more
+#  contributor license agreements.  See the NOTICE file distributed with
+#  this work for additional information regarding copyright ownership.
+#  The ASF licenses this file to You under the Apache License, Version 2.0
+#  (the "License"); you may not use this file except in compliance with
+#  the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+#
+
+<http://bob.example.com/> <http://www.w3.org/1999/xhtml/microdata#item> _:node161nd8236x293102 <http://bob.example.com/> .
+<http://bob.example.com/> <http://www.w3.org/1999/xhtml/microdata#item> _:node161nd8236x293103 <http://bob.example.com/> .
+_:node161nd8236x293102 <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <http://microformats.org/profile/hcard> <http://bob.example.com/> .
+_:node161nd8236x293102 <http://microformats.org/profile/hcard/fn> "Princeton" <http://bob.example.com/> .
+_:node161nd8236x293102 <http://microformats.org/profile/hcard/n> _:node161nd8236x293104 <http://bob.example.com/> .
+_:node161nd8236x293102 <http://microformats.org/profile/hcard/adr> _:node161nd8236x293105 <http://bob.example.com/> .
+_:node161nd8236x293104 <http://microformats.org/profile/hcard/given-name> "Princeton" <http://bob.example.com/> .
+_:node161nd8236x293103 <http://www.w3.org/1999/02/22-rdf-syntax-ns#type> <http://microformats.org/profile/hcard> <http://bob.example.com/> .
+_:node161nd8236x293103 <http://microformats.org/profile/hcard/fn> "Trekkie" <http://bob.example.com/> .
+_:node161nd8236x293103 <http://microformats.org/profile/hcard/n> _:node161nd8236x293106 <http://bob.example.com/> .
+_:node161nd8236x293103 <http://microformats.org/profile/hcard/adr> _:node161nd8236x293105 <http://bob.example.com/> .
+_:node161nd8236x293106 <http://microformats.org/profile/hcard/given-name> "Trekkie" <http://bob.example.com/> .
+_:node161nd8236x293105 <http://microformats.org/profile/hcard/street-address> "Avenue Q" <http://bob.example.com/> .
+<http://bob.example.com/> <http://vocab.sindice.net/date> "2011-06-08T12:56:39+01:00" <http://bob.example.com/> .
+<http://bob.example.com/> <http://vocab.sindice.net/size> "15"^^<http://www.w3.org/2001/XMLSchema#int> <http://bob.example.com/> .
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/5.2.1-non-normative-example-2.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,26 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<p>
+    Both
+ <span itemscope itemtype="http://microformats.org/profile/hcard" itemref="home"><span itemprop="fn"
+         ><span itemprop="n" itemscope><span itemprop="given-name">Princeton</span></span></span></span>
+    and
+ <span itemscope itemtype="http://microformats.org/profile/hcard" itemref="home"><span itemprop="fn"
+         ><span itemprop="n" itemscope><span itemprop="given-name">Trekkie</span></span></span></span>
+    live at
+    <span id="home" itemprop="adr" itemscope><span itemprop="street-address">Avenue Q</span>.</span>
+</p>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic-expected.properties
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic-expected.properties?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic-expected.properties (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic-expected.properties Fri Aug 10 00:40:13 2012
@@ -0,0 +1,29 @@
+#
+#  Licensed to the Apache Software Foundation (ASF) under one or more
+#  contributor license agreements.  See the NOTICE file distributed with
+#  this work for additional information regarding copyright ownership.
+#  The ASF licenses this file to You under the Apache License, Version 2.0
+#  (the "License"); you may not use this file except in compliance with
+#  the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+#
+
+result0={ "xpath" : "/HTML[1]/BODY[1]/DIV[1]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/P[1]/SPAN[1]", "name" : "name", "value" : { "content" : "Elizabeth", "type" : "Plain" } } ] }
+result1={ "xpath" : "/HTML[1]/BODY[1]/DIV[2]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[2]/P[1]/SPAN[1]", "name" : "name", "value" : { "content" : "Daniel", "type" : "Plain" } } ] }
+result2={ "xpath" : "/HTML[1]/BODY[1]/DIV[3]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[3]/P[2]/SPAN[1]", "name" : "band", "value" : { "content" : "Four Parts Water", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[3]/P[3]/SPAN[1]", "name" : "nationality", "value" : { "content" : "British", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[3]/P[1]/SPAN[1]", "name" : "name", "value" : { "content" : "Neil", "type" : "Plain" } } ] }
+result3={ "xpath" : "/HTML[1]/BODY[1]/DIV[4]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[4]/IMG[1]", "name" : "image", "value" : { "content" : "google-logo.png", "type" : "Link" } } ] }
+result4={ "xpath" : "/HTML[1]/BODY[1]/DIV[5]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[5]/TIME[1]", "name" : "birthday", "value" : { "content" : "2009-05-10", "type" : "Date" } } ] }
+result5={ "xpath" : "/HTML[1]/BODY[1]/DIV[6]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[6]/UL[1]/LI[1]", "name" : "flavor", "value" : { "content" : "Lemon sorbet", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[6]/UL[1]/LI[2]", "name" : "flavor", "value" : { "content" : "Apricot sorbet", "type" : "Plain" } } ] }
+result6={ "xpath" : "/HTML[1]/BODY[1]/DIV[7]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[7]/SPAN[1]", "name" : "favorite-fruit", "value" : { "content" : "orange", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[7]/SPAN[1]", "name" : "favorite-color", "value" : { "content" : "orange", "type" : "Plain" } } ] }
+result7={ "xpath" : "/HTML[1]/BODY[1]/FIGURE[1]/FIGCAPTION[1]/SPAN[1]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/FIGURE[1]/FIGCAPTION[1]/SPAN[1]/SPAN[1]", "name" : "name", "value" : { "content" : "The Castle", "type" : "Plain" } } ] }
+result8={ "xpath" : "/HTML[1]/BODY[1]/SPAN[1]", "id" : null, "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/SPAN[1]/META[1]", "name" : "name", "value" : { "content" : "The Castle", "type" : "Plain" } } ] }
+result9={ "xpath" : "/HTML[1]/BODY[1]/SECTION[1]", "id" : null, "refs" : [], "type" : "http://example.org/animals#cat", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/SECTION[1]/P[1]", "name" : "desc", "value" : { "content" : "Hedral is a male american domestic shorthair,\\n     with a fluffy black fur with white paws and belly.", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[1]/H1[1]", "name" : "name", "value" : { "content" : "Hedral", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[1]/IMG[1]", "name" : "img", "value" : { "content" : "hedral.jpeg", "type" : "Link" } } ] }
+result10={ "xpath" : "/HTML[1]/BODY[1]/DL[1]", "id" : null, "refs" : [], "type" : "http://vocab.example.net/book", "itemid" : "urn:isbn:0-330-34032-8", "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DL[1]/DD[2]", "name" : "author", "value" : { "content" : "Peter F. Hamilton\\n    ", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DL[1]/DD[1]", "name" : "title", "value" : { "content" : "The Reality Dysfunction\\n    ", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DL[1]/DD[3]/TIME[1]", "name" : "pubdate", "value" : { "content" : "1996-01-26", "type" : "Date" } } ] }
+result11={ "xpath" : "/HTML[1]/BODY[1]/SECTION[2]", "id" : null, "refs" : [], "type" : "http://example.org/animals#cat", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/P[1]", "name" : "desc", "value" : { "content" : "Hedral is a male american domestic shorthair, with a fluffy\\n        black fur with\\n        white paws and belly.", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/H1[1]", "name" : "name", "value" : { "content" : "Hedral", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/IMG[1]", "name" : "img", "value" : { "content" : "hedral.jpeg", "type" : "Link" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/H1[1]", "name" : "http://example.com/fn", "value" : { "content" : "Hedral", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/P[1]/SPAN[1]", "name" : "http://example.com/color", "value" : { "content" : "black", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/SECTION[2]/P[1]/SPAN[2]", "name" : "ht
 tp://example.com/color", "value" : { "content" : "white", "type" : "Plain" } } ] }
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-basic.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,107 @@
+<!DOCTYPE html>
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html>
+<head>
+<body>
+
+<!--  result0 -->
+<div itemscope>
+    <p>My name is <span itemprop="name">Elizabeth</span>.</p>
+</div>
+<!--  result1 -->
+<div itemscope>
+    <p>My name is <span itemprop="name">Daniel</span>.</p>
+</div>
+
+<!--  result2 -->
+<div itemscope>
+    <p>My name is <span itemprop="name">Neil</span>.</p>
+    <p>My band is called <span itemprop="band">Four Parts Water</span>.</p>
+    <p>I am <span itemprop="nationality">British</span>.</p>
+</div>
+
+<!--  result3 -->
+<div itemscope>
+    <img itemprop="image" src="google-logo.png" alt="Google">
+</div>
+
+<!--  result4 -->
+<div itemscope>
+ I was born on <time itemprop="birthday" datetime="2009-05-10">May 10th 2009</time>.
+</div>
+
+<!--  result5 -->
+<div itemscope>
+    <p>Flavors in my favorite ice cream:</p>
+    <ul>
+        <li itemprop="flavor">Lemon sorbet</li>
+        <li itemprop="flavor">Apricot sorbet</li>
+    </ul>
+</div>
+
+<!--  result6 -->
+<div itemscope>
+    <span itemprop="favorite-color favorite-fruit">orange</span>
+</div>
+
+<!--  result7 -->
+<figure>
+    <img src="castle.jpeg">
+    <figcaption><span itemscope><span itemprop="name">The Castle</span></span> (1986)</figcaption>
+</figure>
+
+<!--  result8 -->
+<span itemscope><meta itemprop="name" content="The Castle"></span>
+<figure>
+    <img src="castle.jpeg">
+    <figcaption>The Castle (1986)</figcaption>
+</figure>
+
+<!--  result9 -->
+<section itemscope itemtype="http://example.org/animals#cat">
+    <h1 itemprop="name">Hedral</h1>
+    <p itemprop="desc">Hedral is a male american domestic shorthair,
+     with a fluffy black fur with white paws and belly.</p>
+    <img itemprop="img" src="hedral.jpeg" alt="" title="Hedral, age 18 months">
+</section>
+
+<!--  result10 -->
+<dl itemscope
+    itemtype="http://vocab.example.net/book"
+    itemid="urn:isbn:0-330-34032-8">
+    <dt>Title
+    <dd itemprop="title">The Reality Dysfunction
+    <dt>Author
+    <dd itemprop="author">Peter F. Hamilton
+    <dt>Publication date
+    <dd>
+    <time itemprop="pubdate" datetime="1996-01-26">26 January 1996</time>
+</dl>
+
+<!--  result11 -->
+<section itemscope itemtype="http://example.org/animals#cat">
+    <h1 itemprop="name http://example.com/fn">Hedral</h1>
+    <p itemprop="desc">Hedral is a male american domestic shorthair, with a fluffy
+        <span itemprop="http://example.com/color">black</span> fur with
+        <span itemprop="http://example.com/color">white</span> paws and belly.</p>
+    <img itemprop="img" src="hedral.jpeg" alt="" title="Hedral, age 18 months">
+</section>
+
+</body>
+</head>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref-expected.properties
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref-expected.properties?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref-expected.properties (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref-expected.properties Fri Aug 10 00:40:13 2012
@@ -0,0 +1,25 @@
+#
+#  Licensed to the Apache Software Foundation (ASF) under one or more
+#  contributor license agreements.  See the NOTICE file distributed with
+#  this work for additional information regarding copyright ownership.
+#  The ASF licenses this file to You under the Apache License, Version 2.0
+#  (the "License"); you may not use this file except in compliance with
+#  the License.  You may obtain a copy of the License at
+#
+#   http://www.apache.org/licenses/LICENSE-2.0
+#
+#  Unless required by applicable law or agreed to in writing, software
+#  distributed under the License is distributed on an "AS IS" BASIS,
+#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+#  See the License for the specific language governing permissions and
+#  limitations under the License.
+#
+
+result0={ "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]", "id" : "is1", "refs" : [], "type" : "http://type/IScopeType1", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/A[2]", "name" : "p4", "value" : { "content" : "http://www.domain.org/path/2", "type" : "Link" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/P[2]", "name" : "p3", "value" : { "content" : "Some Text 2", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/P[1]", "name" : "p2", "value" : { "content" : "Some Text 1", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/A[1]", "name" : "p1", "value" : { "content" : "http://www.domain.org/path/1", "type" : "Link" } } ] }
+result1={ "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[2]", "id" : "is2", "refs" : ["ip5", "ip4", "ip3", "unexisting"], "type" : "http://type/IScopeType2", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[2]/P[1]", "name" : "p6", "value" : { "content" : "Some Text 3", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[2]/IMG[1]", "name" : "p5", "value" : { "content" : "http://source/dom/path", "type" : "Link" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/A[2]", "name" : "p4", "value" : { "content" : "http://www.domain.org/path/2", "type" : "Link" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[1]/P[2]", "name" : "p3", "value" : { "content" : "Some Text 2", "type" : "Plain" } } ] }
+result2={ "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]", "id" : "loops", "refs" : [], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "id" : "loop2", "refs" : ["loop3"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "id" : "loop3", "refs" : ["loop4"], "type" : null, "itemid" : null, "properties" : [  ] }, "type" : "Nested" } } ] }, "type" : "Nested" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "id" : "loop3", "refs" : ["loop4"], "type" : null, "itemid" : null, "properties" : [  ] }, "type" : "Nested" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[5]", "name" : "next", "value
 " : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[5]", "id" : "loop4", "refs" : ["loop2"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "id" : "loop2", "refs" : ["loop3"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "id" : "loop3", "refs" : ["loop4"], "type" : null, "itemid" : null, "properties" : [  ] }, "type" : "Nested" } } ] }, "type" : "Nested" } } ] }, "type" : "Nested" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[1]", "name" : "self", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[1]", "id" : "loop0", "refs" : ["loop0"], "type" : null, "itemid" : null, "properties" : [  ] }, "type" : "Nested" } }, { "xpath" : "/HTML[1]/BOD
 Y[1]/DIV[1]/DIV[3]/DIV[2]", "name" : "head", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[2]", "id" : "loop1", "refs" : ["loop2"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[3]", "id" : "loop2", "refs" : ["loop3"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "name" : "next", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[4]", "id" : "loop3", "refs" : ["loop4"], "type" : null, "itemid" : null, "properties" : [  ] }, "type" : "Nested" } } ] }, "type" : "Nested" } } ] }, "type" : "Nested" } } ] }
+result3={ "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[4]/DIV[2]", "id" : "idItem", "refs" : ["insideOut"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[4]/DIV[2]/DIV[1]", "name" : "prop", "value" : { "content" : "Included via tree.", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[4]/DIV[1]", "name" : "prop", "value" : { "content" : "Included via parent, before.", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[1]/DIV[4]/DIV[3]", "name" : "prop", "value" : { "content" : "Included via parent, after.", "type" : "Plain" } } ] }
+error0={ "message" : "Unknown itemProp id 'unexisting'", "path" : "null", "begin_row" : -1, "begin_col" : -1, "end_row" : -1, "end_col" : -1 }
+error1={ "message" : "Duplicated deferred itemProp 'p5'.", "path" : "/HTML[1]/BODY[1]/DIV[1]/DIV[2]", "begin_row" : 26, "begin_col" : 5, "end_row" : 26, "end_col" : 97 }
+error2={ "message" : "Loop detected with depth 1 while dereferencing itemProp 'loop0' .", "path" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[1]", "begin_row" : 33, "begin_col" : 9, "end_row" : 33, "end_col" : 67 }
+error3={ "message" : "Loop detected with depth 3 while dereferencing itemProp 'loop2' .", "path" : "/HTML[1]/BODY[1]/DIV[1]/DIV[3]/DIV[5]", "begin_row" : 37, "begin_col" : 9, "end_row" : 37, "end_col" : 67 }
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-itemref.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,48 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<div id="data">
+    <div id="is1" itemscope itemtype="http://type/IScopeType1">
+        <a id="ip1" itemprop="p1" href="http://www.domain.org/path/1"></a>
+        <p id="ip2" itemprop="p2">Some Text 1</p>
+        <p id="ip3" itemprop="p3">Some Text 2</p>
+        <a id="ip4" itemprop="p4" href="http://www.domain.org/path/2"></a>
+    </div>
+
+    <!-- Duplicate and unexisting itemrefs. -->
+    <div id="is2" itemscope itemtype="http://type/IScopeType2" itemref="ip5 ip4 ip3 unexisting">
+        <img id="ip5" itemprop="p5" src="http://source/dom/path">
+        <p   id="ip6" itemprop="p6">Some Text 3</p>
+    </div>
+
+    <!-- Loops. -->
+    <div id="loops" itemscope>
+        <div id="loop0" itemprop="self" itemscope itemref="loop0"></div>
+        <div id="loop1" itemprop="head" itemscope itemref="loop2">not in the loop</div>
+        <div id="loop2" itemprop="next" itemscope itemref="loop3"></div>
+        <div id="loop3" itemprop="next" itemscope itemref="loop4"></div>
+        <div id="loop4" itemprop="next" itemscope itemref="loop2"></div>
+    </div>
+
+    <!-- Inside - Out Nesting. -->
+    <div id="insideOut">
+        <div id="idBefore" itemprop="prop">Included via parent, before.</div>
+        <div id="idItem" itemscope itemref="insideOut">
+            <div id="ioChild" itemprop="prop">Included via tree.</div>
+        </div>
+        <div id="idAfter" itemprop="prop">Included via parent, after.</div>
+    </div>
+</div>

Added: incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-json-serialization.json
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-json-serialization.json?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-json-serialization.json (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microdata/microdata-json-serialization.json Fri Aug 10 00:40:13 2012
@@ -0,0 +1 @@
+{ "result" : [{ "xpath" : "/HTML[1]/BODY[1]/DIV[1]", "id" : "amanda", "refs" : ["a", "b"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[2]", "name" : "band", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[2]", "id" : "b", "refs" : ["c"], "type" : null, "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[3]/P[1]/SPAN[1]", "name" : "name", "value" : { "content" : "Jazz Band", "type" : "Plain" } }, { "xpath" : "/HTML[1]/BODY[1]/DIV[3]/P[2]/SPAN[1]", "name" : "size", "value" : { "content" : "12", "type" : "Plain" } } ] }, "type" : "Nested" } }, { "xpath" : "/HTML[1]/BODY[1]/P[1]/SPAN[1]", "name" : "name", "value" : { "content" : "Amanda", "type" : "Plain" } } ] }, { "xpath" : "/HTML[1]/BODY[1]/DIV[4]", "id" : null, "refs" : [], "type" : "http://schema.org/Movie", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[4]/H1[1]", "name" : "name", "value" : { "content" : "Avatar", "type" : "Plain" } }, { 
 "xpath" : "/HTML[1]/BODY[1]/DIV[4]/DIV[1]", "name" : "director", "value" : { "content" : { "xpath" : "/HTML[1]/BODY[1]/DIV[4]/DIV[1]", "id" : null, "refs" : [], "type" : "http://schema.org/Person", "itemid" : null, "properties" : [ { "xpath" : "/HTML[1]/BODY[1]/DIV[4]/DIV[1]/SPAN[1]", "name" : "name", "value" : { "content" : "James Cameron", "type" : "Plain" } } ] }, "type" : "Nested" } } ] }] }
\ No newline at end of file



Mime
View raw message