You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@any23.apache.org by an...@apache.org on 2012/08/10 02:40:22 UTC

svn commit: r1371537 [22/30] - in /incubator/any23/trunk: ./ core/ core/src/test/java/org/apache/any23/ core/src/test/java/org/apache/any23/cli/ core/src/test/java/org/apache/any23/extractor/ core/src/test/java/org/apache/any23/extractor/csv/ core/src/...

Added: incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/37-singleton.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/37-singleton.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/37-singleton.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/37-singleton.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,49 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+        "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+  <head>
+    <meta http-equiv="Content-type" content="text/html; charset=utf-8" />
+    <title>37-singleton</title>
+    <link rel="alternate" href="37-singleton.vcf" type="text/directory" />
+  </head>
+  <body>
+    <p class="vcard">
+      <span class="fn n"><span class="given-name">john</span> <span class="family-name"><span class="sort-string">d</span>oe</span> 1</span>
+      <span class="fn n"><span class="given-name"><span class="sort-string">j</span>ohn</span> <span class="family-name">doe</span> 2</span>
+
+      <abbr class="bday" title="20060707">today</abbr>
+      <abbr class="bday" title="20060708">tomorrow</abbr>
+
+      <abbr class="geo" title="123.45;67.89">Here</abbr>
+      <abbr class="geo" title="98.765;43.21">There</abbr>
+
+      <abbr class="rev" title="20060707">today</abbr>
+      <abbr class="rev" title="20060708">tomorrow</abbr>
+
+      <abbr class="uid" title="unique-id-1">id-1</abbr>
+      <abbr class="uid" title="unique-id-2">id-2</abbr>
+
+      <span class="tz">+0600</span>
+      <span class="tz">+0800</span>
+
+      <span class="class">public</span>
+      <span class="class">private</span>
+    </p>
+  </body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/38-uid.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/38-uid.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/38-uid.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/38-uid.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,43 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+        "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+  <head>
+    <meta http-equiv="Content-type" content="text/html; charset=utf-8" />
+    <title>38-uid</title>
+    <link rel="alternate" href="38-uid.vcf" type="text/directory" />
+  </head>
+  <body>
+    <div class="vcard">
+      <span class="fn">Ryan King</span>
+      <a class="url uid" href="http://theryanking.com/contact/">My other hCard</a>
+    </div>
+    <div class="vcard">
+      <span class="fn">Ryan King</span>
+      <object class="url uid" data="http://theryanking.com/contact/">My other hCard</object>
+    </div>
+    <div class="vcard">
+      <span class="fn">Ryan King</span>
+      <img class="url uid" src="http://theryanking.com/contact/" alt="my other hcard" />
+    </div>
+    <div class="vcard">
+      <span class="fn">Ryan King</span>
+      <map id="foo"><area class="url uid" href="http://theryanking.com/contact/" alt="my other hcard" /></map>
+    </div>
+  </body>
+</html>
\ No newline at end of file

Added: incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/40-fn-inside-adr.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/40-fn-inside-adr.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/40-fn-inside-adr.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/40-fn-inside-adr.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,115 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+        "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html>
+<head>
+  <meta http-equiv="Content-type" content="text/html; charset=utf-8" />
+  <title>40-fn-inside-adr</title>
+  <link rel="alternate" href="01-tantek-basic.vcf" type="text/directory" />
+  <link rel="alternate" href="01-tantek-basic.vcf" type="text/directory" />
+</head>
+<body>
+
+<table class="infobox geography vcard" style="width: 270px;">
+<tr class="adr">
+<td colspan="2" align="center" style="background: #D8E2EF; width:100%; font-size: 1.25em; line-height: 1.2;"><b><span class="fn org">Berlin</span></b></td>
+</tr>
+<tr>
+<td colspan="2" style="text-align: center; padding: 0.0em 0.0em 0.0em 0.0em;;">
+<div class="floatnone"><span><a href="/wiki/Imagine:Cityscapeberlin2006.JPG" class="image" title="Cityscapeberlin2006.JPG"><img alt="" src="http://upload.wikimedia.org/wikipedia/commons/thumb/d/db/Cityscapeberlin2006.JPG/268px-Cityscapeberlin2006.JPG" width="268" height="158" border="0" /></a></span></div>
+</td>
+</tr>
+
+<tr>
+<td align="center" style="width: 50%; background:#D8E2EF;"><b>Stemă</b></td>
+<td align="center" style="width: 50%; background:#D8E2EF;"><b>Localizare</b></td>
+</tr>
+<tr>
+<td align="center" style="width: 50%; vertical-align: middle; padding: 0.2em 0.2em 0.2em 0.2em;"><a href="/wiki/Imagine:Flag_of_Berlin.svg" class="image" title="Stema Berlin"><img alt="Stema Berlin" src="http://upload.wikimedia.org/wikipedia/commons/thumb/e/ec/Flag_of_Berlin.svg/120px-Flag_of_Berlin.svg.png" width="120" height="72" border="0" /></a></td>
+<td align="center" style="width: 50%; vertical-align: top; padding: 0.2em 0.2em 0.2em 0.2em;">
+<div style="width: 112px; float:none; clear:both;">
+<div style="position: relative; padding: 0px; width: 110px"><a href="/wiki/Imagine:Karte_Deutschland.svg" class="image" title="Berlin (Germania)"><img alt="Berlin (Germania)" src="http://upload.wikimedia.org/wikipedia/commons/thumb/e/e3/Karte_Deutschland.svg/110px-Karte_Deutschland.svg.png" width="110" height="149" border="0" /></a><br />
+<div style="position: absolute; z-index: 2; top: 32.7%; left: 79.2%; height: 0; width: 0; margin: 0; padding: 0;">
+<div style="position: relative; text-align: center; left: -4px; top: -4px; width: 8px; font-size: 8px;"><a href="/wiki/Imagine:Red_pog.svg" class="image" title="Berlin"><img alt="Berlin" src="http://upload.wikimedia.org/wikipedia/commons/thumb/0/0c/Red_pog.svg/8px-Red_pog.svg.png" width="8" height="8" border="0" /></a></div>
+<div style="font-size: 90%; line-height: 110%; position: relative; top: -1.5em; width: 6em; left: 0.5em; text-align: left;"></div>
+</div>
+</div>
+<div style="font-size: 90%"></div>
+
+</div>
+</td>
+</tr>
+<tr>
+<td colspan="2" align="center" style="background:#D8E2EF;"><b>Administraţie</b></td>
+</tr>
+<tr class="mergedtoprow">
+<th><a href="/wiki/List%C4%83_de_state_suverane" title="Listă de state suverane">Ţară</a></th>
+<td><a href="/wiki/Germania" title="Germania">Germania</a> <a href="/wiki/Imagine:Flag_of_Germany.svg" class="image" title="Flag of Germany.svg"><img alt="" src="http://upload.wikimedia.org/wikipedia/commons/thumb/b/ba/Flag_of_Germany.svg/22px-Flag_of_Germany.svg.png" width="22" height="13" border="0" /></a></td>
+</tr>
+<tr class="mergedrow">
+<td><b><a href="/wiki/Landurile_Germaniei" title="Landurile Germaniei">Land</a></b></td>
+
+<td><strong class="selflink">Berlin</strong></td>
+</tr>
+<tr class="mergedrow">
+<td><b><a href="/wiki/Districtele_Germaniei" class="mw-redirect" title="Districtele Germaniei">District</a></b></td>
+<td><a href="/w/index.php?title=Kreifreistadt&amp;action=edit&amp;redlink=1" class="new" title="Kreifreistadt — pagină inexistentă">Kreifreistadt</a></td>
+</tr>
+<tr class="mergedbottomrow">
+<td><b><a href="/wiki/Partid_politic" title="Partid politic">Partide guvernante</a></b></td>
+<td>SPD /&#160;PDS</td>
+</tr>
+<tr class="mergedrow">
+
+<td>&#160;- <b><a href="/w/index.php?title=Suprafa%C5%A3%C4%83_urban%C4%83&amp;action=edit&amp;redlink=1" class="new" title="Suprafaţă urbană — pagină inexistentă">Urban</a></b></td>
+<td>3.700.000</td>
+</tr>
+<tr class="mergedrow">
+<td>&#160;- <b><a href="/w/index.php?title=Suprafa%C5%A3%C4%83_metropolitan%C4%83&amp;action=edit&amp;redlink=1" class="new" title="Suprafaţă metropolitană — pagină inexistentă">Metro</a></b></td>
+<td>4.262.480&#160;<small><i>(12/2004)</i></small></td>
+</tr>
+<tr>
+<td colspan="2" align="center" style="background:#D8E2EF;"><b>Alte informaţii</b></td>
+
+</tr>
+<tr class="mergedtoprow">
+<td><b><a href="/wiki/Fus_orar" title="Fus orar">Fus orar</a></b></td>
+<td><a href="/wiki/Ora_Europei_Centrale" title="Ora Europei Centrale">CET</a>/<a href="/w/index.php?title=Ora_de_var%C4%83_a_Europei_Centrale&amp;action=edit&amp;redlink=1" class="new" title="Ora de vară a Europei Centrale — pagină inexistentă">CEST</a> (<a href="/w/index.php?title=UTC%2B1&amp;action=edit&amp;redlink=1" class="new" title="UTC+1 — pagină inexistentă">UTC+1</a>/<a href="/wiki/UTC%2B2" title="UTC+2">+2</a>)</td>
+</tr>
+<tr class="mergedrow">
+<td><b>Număr de înmatriculare (auto)</b></td>
+
+<td>B</td>
+</tr>
+<tr class="mergedrow">
+<td><b>Cod poştal</b></td>
+<td>10001–14199</td>
+</tr>
+<tr class="mergedrow">
+<td><b>Cod zonal</b></td>
+<td>030</td>
+</tr>
+<tr class="mergedbottomrow">
+<td><b><a href="/wiki/Website" class="mw-redirect" title="Website">Website</a></b></td>
+
+<td><a href="http://www.berlin.de/english/index.html" class="external text" title="http://www.berlin.de/english/index.html" rel="nofollow">berlin.de</a> / <a href="http://www.3d-stadtmodell-berlin.de/3d/en/seite0.jsp" class="external text" title="http://www.3d-stadtmodell-berlin.de/3d/en/seite0.jsp" rel="nofollow">3D Berlin</a></td>
+</tr>
+</table>
+</body>
+
+</html>

Added: incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/41-ignore-children.html
URL: http://svn.apache.org/viewvc/incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/41-ignore-children.html?rev=1371537&view=auto
==============================================================================
--- incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/41-ignore-children.html (added)
+++ incubator/any23/trunk/test-resources/src/test/resources/microformats/hcard/41-ignore-children.html Fri Aug 10 00:40:13 2012
@@ -0,0 +1,79 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN"
+"http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+   http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
+<html xmlns="http://www.w3.org/1999/xhtml">
+  <head>
+    <meta http-equiv="Content-type" content="text/html; charset=utf-8" />
+    <title>41-ignore-children</title>
+    <link rel="alternate" href="38-uid.vcf" type="text/directory" />
+  </head>
+  <body>
+
+    <div class="vcard">
+        <em>
+        <span class="url fn">
+        <a href="http://privpages.de"
+           onclick="pageTracker._trackPageview('/outgoing/privpages.de?referer=');">Melanie Klöß</a>
+        </span>
+        <br/>
+        <span class="adr"> <span class="type" style="display: none;">home</span>
+          <span class="street-address">Ippendorfer Weg. 24</span><br />
+          <span class="postal-code">53127</span> <span class="locality">Bonn</span><br />
+          <span class="country-name" style="display: none;">Germany</span>
+        </span>
+        </em>
+        <strong>mail</strong>:
+      <a class="email" href="mailto:mkloes@gmail.com">mkloes@gmail.com</a><br />
+      <strong>icq</strong>: 67296399, 65781370<br />
+      <strong>aim</strong>: caynea, oiseau3729<br />
+      <strong>y!</strong>: sumomo3729<br />
+      <strong>msn</strong>: chii3729@hotmail.com<br />
+      <strong>jabber</strong>: chise@amessage.de<br />
+      <strong>skype</strong>: nur auf Anfrage<br />
+      <strong>sonstiges</strong>: <a
+        href="http://www.amazon.de/gp/registry/38SWPRDM17NMH"
+        onclick="pageTracker._trackPageview('/outgoing/www.amazon.de/gp/registry/38SWPRDM17NMH?referer=');">Amazon</a>,
+      <a href="http://www.betamarker.com/users/sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/www.betamarker.com/users/sumomi?referer=');">Beta
+        Marker</a>, <a href="http://www.box.net/public/gypt8822cs#main"
+        onclick="pageTracker._trackPageview('/outgoing/www.box.net/public/gypt8822cs_main?referer=');">Box.net</a>,
+      <a href="http://del.icio.us/sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/del.icio.us/sumomi?referer=');">del.icio.us</a>,
+      <a href="http://sumomi.deviantart.com/"
+        onclick="pageTracker._trackPageview('/outgoing/sumomi.deviantart.com/?referer=');">deviantart</a>,
+      <a href="http://www.flickr.com/photos/sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/www.flickr.com/photos/sumomi?referer=');">Flickr</a>,
+      <a href="http://www.last.fm/user/sumomi/"
+        onclick="pageTracker._trackPageview('/outgoing/www.last.fm/user/sumomi/?referer=');">Last.fm</a>,
+      <a href="http://www.librarything.com/catalog.php?view=chise&shelf=shelf"
+        onclick="pageTracker._trackPageview('/outgoing/www.librarything.com/catalog.php?view=chise_shelf=shelf&referer=');">LibraryThing</a>,
+      <a href="http://www.listible.com/user/chise"
+        onclick="pageTracker._trackPageview('/outgoing/www.listible.com/user/chise?referer=');">Listible</a>,
+      <a href="http://www.qype.com/people/sumomi?inviter=sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/www.qype.com/people/sumomi?inviter=sumomi&referer=');">Qype</a>,
+      <a href="http://www.thisnext.com/by/oiseau/"
+        onclick="pageTracker._trackPageview('/outgoing/www.thisnext.com/by/oiseau/?referer=');">ThisNext</a>,
+      <a href="http://twitter.com/sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/twitter.com/sumomi?referer=');">Twitter</a>,
+      <a href="http://www.wishlistr.com/sumomi"
+        onclick="pageTracker._trackPageview('/outgoing/www.wishlistr.com/sumomi?referer=');">Wishlistr</a>,
+      <a href="http://youtube.com/user/haquer"
+        onclick="pageTracker._trackPageview('/outgoing/youtube.com/user/haquer?referer=');">YouTube</a>
+    </div>
+  </body>
+</html>
\ No newline at end of file