You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@any23.apache.org by le...@apache.org on 2013/01/19 22:54:44 UTC

svn commit: r1435729 [3/3] - in /any23/trunk: ./ core/src/test/java/org/apache/any23/extractor/html/ mime/src/main/resources/org/apache/any23/mime/ plugins/basic-crawler/ plugins/office-scraper/ test-resources/src/test/resources/microformats/hcard/

Modified: any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml
URL: http://svn.apache.org/viewvc/any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml (original)
+++ any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml Sat Jan 19 21:54:44 2013
@@ -16,5 +16,5 @@
   limitations under the License.
 -->
 <properties>
-    <mimeTypeRepository resource="/org/apache/any23/mime/mimetypes.xml" magic="false"/>
+    <mimeTypeRepository resource="/org/apache/any23/mime/any23-tika-1.2-mimetypes.xml" magic="false"/>
 </properties>
\ No newline at end of file

Modified: any23/trunk/plugins/basic-crawler/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/plugins/basic-crawler/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/plugins/basic-crawler/pom.xml (original)
+++ any23/trunk/plugins/basic-crawler/pom.xml Sat Jan 19 21:54:44 2013
@@ -60,7 +60,7 @@
     <dependency>
       <groupId>edu.uci.ics</groupId>
       <artifactId>crawler4j</artifactId>
-      <version>3.3</version>
+      <version>3.4</version>
       <type>jar</type>
       <scope>compile</scope>
     </dependency>

Modified: any23/trunk/plugins/office-scraper/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/plugins/office-scraper/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/plugins/office-scraper/pom.xml (original)
+++ any23/trunk/plugins/office-scraper/pom.xml Sat Jan 19 21:54:44 2013
@@ -52,7 +52,6 @@
     <dependency>
       <groupId>org.apache.poi</groupId>
       <artifactId>poi</artifactId>
-      <version>3.7</version>
     </dependency>
 
     <!-- BEGIN: plugins -->

Modified: any23/trunk/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/pom.xml (original)
+++ any23/trunk/pom.xml Sat Jan 19 21:54:44 2013
@@ -278,7 +278,7 @@
       <dependency>
         <groupId>commons-codec</groupId>
         <artifactId>commons-codec</artifactId>
-        <version>1.3</version>
+        <version>1.6</version>
       </dependency>
       <dependency>
         <groupId>commons-cli</groupId>
@@ -286,21 +286,46 @@
         <version>1.2</version>
       </dependency>
       <dependency>
+        <groupId>org.apache.commons</groupId>
+        <artifactId>commons-compress</artifactId>
+        <version>1.4.1</version>
+      </dependency>
+      <dependency>
         <groupId>net.sourceforge.nekohtml</groupId>
         <artifactId>nekohtml</artifactId>
-        <version>1.9.14</version>
+        <version>1.9.15</version>
       </dependency>
 
       <!-- BEGIN: Tika -->
       <dependency>
         <groupId>org.apache.tika</groupId>
         <artifactId>tika-core</artifactId>
-        <version>0.6</version>
+        <version>1.2</version>
       </dependency>
       <dependency>
         <groupId>org.apache.tika</groupId>
         <artifactId>tika-parsers</artifactId>
-        <version>0.6</version>
+        <version>1.2</version>
+      </dependency>
+      <dependency>
+        <groupId>org.apache.poi</groupId>
+        <artifactId>poi</artifactId>
+        <version>3.8</version>
+      </dependency>
+      <dependency>
+        <groupId>org.apache.poi</groupId>
+        <artifactId>poi-ooxml</artifactId>
+        <version>3.8</version>
+      </dependency>
+      <dependency>
+        <groupId>org.apache.poi</groupId>
+        <artifactId>poi-ooxml-schemas</artifactId>
+        <version>3.8</version>
+      </dependency>
+      <dependency>
+        <groupId>org.apache.poi</groupId>
+        <artifactId>poi-scratchpad</artifactId>
+        <version>3.8</version>
       </dependency>
       <!-- END: Tika -->
 

Modified: any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html
URL: http://svn.apache.org/viewvc/any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html (original)
+++ any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html Sat Jan 19 21:54:44 2013
@@ -25,7 +25,7 @@
   <body>
     <p class="vcard">
       <span class="fn">John Doe</span>
-      <object class="photo logo" data="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAADIAAAAyCAMAAAAp4XiDAAAABGdBTUEAAK/INwWK6QAAABl0RVh0U29mdHdhcmUAQWRvYmUgSW1hZ2VSZWFkeXHJZTwAAAASUExURf///8zMzJmZmWZmZjMzMwAAAPOPemkAAAM1SURBVHjaYmBgYGBkYQUBFkYWFiCPCchixQAMCCZAACF0MAMVM4K4TFh0IGsBCCAkOxhYmBnAAKaHhZkZmxaAAGJgYIbpYGBihGgBWsTMzMwE4jIhaWGAYoAAYmCECDExYAcwGxkg5oNIgABigDqLARdgZmGB2wICrKwAAcSA3xKgIxlZ0PwCEEAMBCxhgHoWSQtAADFAAxgfYEJ1GEAAQbQw4tUCsocBYQVAADEgu4uRkREeUCwszEwwLhOKLQABhNDCBA4aSDgwwhIAJKqYUPwCEEAMUK/AUwnc9aywJMCI7DAgAAggBohZ8JTBhGIJzCoWZL8ABBCYidAB8RUjWppkYUG2BSCAGMDqEMZiswUtXgACiAHsFYixTMywGGLGpgUWYgABxAA2mQkWCMyMqFoYmdD8ACQAAogBHJHMrCxg1cyIiICmCkYWDFsAAgiihYmZCewFFpR0BfI3LLch+QUggBiQ0iQjEyMDmh54qCBlUIAAYsCRJsElADQvgWKTlRGeKwECiAF3XgGmMEYQYADZzcoA9z5AAMG9RQCAtEC9DxBADFiyFyMjVi0wABBAWLQwQdIiuhYGWJIACCBg+KKUJ9BoBRdS2LQALQMIIGDQIEmwAO1kYcVWHCDZAhBAqFqYmOAxj2YNtAwDAYAAYmDEiBYWzHKKkRERYiwAAYSphZEZwxZGZiZQVEJTJkAAMTCyokc7M5oORlC5wcoEjxeAAAJqQXU0UB6W5WFmABMtEzMi1wEEEFAbE0YyAUuz
 MMEsYQalMkQSBQggUDmNPU3C9IA4LCxI+QUggEBiKOU8yExgqccCL3chnkPKlQABhGo6ejHBDKmdUHMlQAAhhQvQaGZGkBIkjcAMywLmI+VKgABCSowsTJhZkhlWXiBpAQggYBqBZl9GVOdBcz0LZqEEEEAMqLULMBLg1THWog9IAwQQA0qiZcRW5aPbAhBADCg1El4tMAAQQAxoiZYZXnTh1AIQQAzo2QlYpDDjcBgrxGEAAcSAJTthswmiBUwDBBC2GpkZJTaRvQ+mAQKIAUuuxdZWQvILQABBmSxMjBj5EpcWgACCMoFOYYSpZyHQHgMIMACt2hmoVEikCQAAAABJRU5ErkJggg==" />
+      <object class="photo logo" type="image/png" data="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAADIAAAAyCAMAAAAp4XiDAAAABGdBTUEAAK/INwWK6QAAABl0RVh0U29mdHdhcmUAQWRvYmUgSW1hZ2VSZWFkeXHJZTwAAAASUExURf///8zMzJmZmWZmZjMzMwAAAPOPemkAAAM1SURBVHjaYmBgYGBkYQUBFkYWFiCPCchixQAMCCZAACF0MAMVM4K4TFh0IGsBCCAkOxhYmBnAAKaHhZkZmxaAAGJgYIbpYGBihGgBWsTMzMwE4jIhaWGAYoAAYmCECDExYAcwGxkg5oNIgABigDqLARdgZmGB2wICrKwAAcSA3xKgIxlZ0PwCEEAMBCxhgHoWSQtAADFAAxgfYEJ1GEAAQbQw4tUCsocBYQVAADEgu4uRkREeUCwszEwwLhOKLQABhNDCBA4aSDgwwhIAJKqYUPwCEEAMUK/AUwnc9aywJMCI7DAgAAggBohZ8JTBhGIJzCoWZL8ABBCYidAB8RUjWppkYUG2BSCAGMDqEMZiswUtXgACiAHsFYixTMywGGLGpgUWYgABxAA2mQkWCMyMqFoYmdD8ACQAAogBHJHMrCxg1cyIiICmCkYWDFsAAgiihYmZCewFFpR0BfI3LLch+QUggBiQ0iQjEyMDmh54qCBlUIAAYsCRJsElADQvgWKTlRGeKwECiAF3XgGmMEYQYADZzcoA9z5AAMG9RQCAtEC9DxBADFiyFyMjVi0wABBAWLQwQdIiuhYGWJIACCBg+KKUJ9BoBRdS2LQALQMIIGDQIEmwAO1kYcVWHCDZAhBAqFqYmOAxj2YNtAwDAYAAYmDEiBYWzHKKkRERYiwAAYSphZEZwxZGZiZQVEJTJkAAMTCyokc7M5oORlC5wcoEjxeAAAJqQXU0UB6W5WFmABMtEzM
 i1wEEEFAbE0YyAUuzMMEsYQalMkQSBQggUDmNPU3C9IA4LCxI+QUggEBiKOU8yExgqccCL3chnkPKlQABhGo6ejHBDKmdUHMlQAAhhQvQaGZGkBIkjcAMywLmI+VKgABCSowsTJhZkhlWXiBpAQggYBqBZl9GVOdBcz0LZqEEEEAMqLULMBLg1THWog9IAwQQA0qiZcRW5aPbAhBADCg1El4tMAAQQAxoiZYZXnTh1AIQQAzo2QlYpDDjcBgrxGEAAcSAJTthswmiBUwDBBC2GpkZJTaRvQ+mAQKIAUuuxdZWQvILQABBmSxMjBj5EpcWgACCMoFOYYSpZyHQHgMIMACt2hmoVEikCQAAAABJRU5ErkJggg=="></object>
     </p>
   </body>
 </html>
\ No newline at end of file