You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@any23.apache.org by le...@apache.org on 2013/01/19 22:54:44 UTC
svn commit: r1435729 [3/3] - in /any23/trunk: ./
core/src/test/java/org/apache/any23/extractor/html/
mime/src/main/resources/org/apache/any23/mime/ plugins/basic-crawler/
plugins/office-scraper/ test-resources/src/test/resources/microformats/hcard/
Modified: any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml
URL: http://svn.apache.org/viewvc/any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml (original)
+++ any23/trunk/mime/src/main/resources/org/apache/any23/mime/tika-config.xml Sat Jan 19 21:54:44 2013
@@ -16,5 +16,5 @@
limitations under the License.
-->
<properties>
- <mimeTypeRepository resource="/org/apache/any23/mime/mimetypes.xml" magic="false"/>
+ <mimeTypeRepository resource="/org/apache/any23/mime/any23-tika-1.2-mimetypes.xml" magic="false"/>
</properties>
\ No newline at end of file
Modified: any23/trunk/plugins/basic-crawler/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/plugins/basic-crawler/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/plugins/basic-crawler/pom.xml (original)
+++ any23/trunk/plugins/basic-crawler/pom.xml Sat Jan 19 21:54:44 2013
@@ -60,7 +60,7 @@
<dependency>
<groupId>edu.uci.ics</groupId>
<artifactId>crawler4j</artifactId>
- <version>3.3</version>
+ <version>3.4</version>
<type>jar</type>
<scope>compile</scope>
</dependency>
Modified: any23/trunk/plugins/office-scraper/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/plugins/office-scraper/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/plugins/office-scraper/pom.xml (original)
+++ any23/trunk/plugins/office-scraper/pom.xml Sat Jan 19 21:54:44 2013
@@ -52,7 +52,6 @@
<dependency>
<groupId>org.apache.poi</groupId>
<artifactId>poi</artifactId>
- <version>3.7</version>
</dependency>
<!-- BEGIN: plugins -->
Modified: any23/trunk/pom.xml
URL: http://svn.apache.org/viewvc/any23/trunk/pom.xml?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/pom.xml (original)
+++ any23/trunk/pom.xml Sat Jan 19 21:54:44 2013
@@ -278,7 +278,7 @@
<dependency>
<groupId>commons-codec</groupId>
<artifactId>commons-codec</artifactId>
- <version>1.3</version>
+ <version>1.6</version>
</dependency>
<dependency>
<groupId>commons-cli</groupId>
@@ -286,21 +286,46 @@
<version>1.2</version>
</dependency>
<dependency>
+ <groupId>org.apache.commons</groupId>
+ <artifactId>commons-compress</artifactId>
+ <version>1.4.1</version>
+ </dependency>
+ <dependency>
<groupId>net.sourceforge.nekohtml</groupId>
<artifactId>nekohtml</artifactId>
- <version>1.9.14</version>
+ <version>1.9.15</version>
</dependency>
<!-- BEGIN: Tika -->
<dependency>
<groupId>org.apache.tika</groupId>
<artifactId>tika-core</artifactId>
- <version>0.6</version>
+ <version>1.2</version>
</dependency>
<dependency>
<groupId>org.apache.tika</groupId>
<artifactId>tika-parsers</artifactId>
- <version>0.6</version>
+ <version>1.2</version>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.poi</groupId>
+ <artifactId>poi</artifactId>
+ <version>3.8</version>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.poi</groupId>
+ <artifactId>poi-ooxml</artifactId>
+ <version>3.8</version>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.poi</groupId>
+ <artifactId>poi-ooxml-schemas</artifactId>
+ <version>3.8</version>
+ </dependency>
+ <dependency>
+ <groupId>org.apache.poi</groupId>
+ <artifactId>poi-scratchpad</artifactId>
+ <version>3.8</version>
</dependency>
<!-- END: Tika -->
Modified: any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html
URL: http://svn.apache.org/viewvc/any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html?rev=1435729&r1=1435728&r2=1435729&view=diff
==============================================================================
--- any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html (original)
+++ any23/trunk/test-resources/src/test/resources/microformats/hcard/19-object-data-data-uri.html Sat Jan 19 21:54:44 2013
@@ -25,7 +25,7 @@
<body>
<p class="vcard">
<span class="fn">John Doe</span>
- <object class="photo logo" data="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAADIAAAAyCAMAAAAp4XiDAAAABGdBTUEAAK/INwWK6QAAABl0RVh0U29mdHdhcmUAQWRvYmUgSW1hZ2VSZWFkeXHJZTwAAAASUExURf///8zMzJmZmWZmZjMzMwAAAPOPemkAAAM1SURBVHjaYmBgYGBkYQUBFkYWFiCPCchixQAMCCZAACF0MAMVM4K4TFh0IGsBCCAkOxhYmBnAAKaHhZkZmxaAAGJgYIbpYGBihGgBWsTMzMwE4jIhaWGAYoAAYmCECDExYAcwGxkg5oNIgABigDqLARdgZmGB2wICrKwAAcSA3xKgIxlZ0PwCEEAMBCxhgHoWSQtAADFAAxgfYEJ1GEAAQbQw4tUCsocBYQVAADEgu4uRkREeUCwszEwwLhOKLQABhNDCBA4aSDgwwhIAJKqYUPwCEEAMUK/AUwnc9aywJMCI7DAgAAggBohZ8JTBhGIJzCoWZL8ABBCYidAB8RUjWppkYUG2BSCAGMDqEMZiswUtXgACiAHsFYixTMywGGLGpgUWYgABxAA2mQkWCMyMqFoYmdD8ACQAAogBHJHMrCxg1cyIiICmCkYWDFsAAgiihYmZCewFFpR0BfI3LLch+QUggBiQ0iQjEyMDmh54qCBlUIAAYsCRJsElADQvgWKTlRGeKwECiAF3XgGmMEYQYADZzcoA9z5AAMG9RQCAtEC9DxBADFiyFyMjVi0wABBAWLQwQdIiuhYGWJIACCBg+KKUJ9BoBRdS2LQALQMIIGDQIEmwAO1kYcVWHCDZAhBAqFqYmOAxj2YNtAwDAYAAYmDEiBYWzHKKkRERYiwAAYSphZEZwxZGZiZQVEJTJkAAMTCyokc7M5oORlC5wcoEjxeAAAJqQXU0UB6W5WFmABMtEzMi1wEEEFAbE0YyAUuz
MMEsYQalMkQSBQggUDmNPU3C9IA4LCxI+QUggEBiKOU8yExgqccCL3chnkPKlQABhGo6ejHBDKmdUHMlQAAhhQvQaGZGkBIkjcAMywLmI+VKgABCSowsTJhZkhlWXiBpAQggYBqBZl9GVOdBcz0LZqEEEEAMqLULMBLg1THWog9IAwQQA0qiZcRW5aPbAhBADCg1El4tMAAQQAxoiZYZXnTh1AIQQAzo2QlYpDDjcBgrxGEAAcSAJTthswmiBUwDBBC2GpkZJTaRvQ+mAQKIAUuuxdZWQvILQABBmSxMjBj5EpcWgACCMoFOYYSpZyHQHgMIMACt2hmoVEikCQAAAABJRU5ErkJggg==" />
+ <object class="photo logo" type="image/png" data="data:image/png;base64,iVBORw0KGgoAAAANSUhEUgAAADIAAAAyCAMAAAAp4XiDAAAABGdBTUEAAK/INwWK6QAAABl0RVh0U29mdHdhcmUAQWRvYmUgSW1hZ2VSZWFkeXHJZTwAAAASUExURf///8zMzJmZmWZmZjMzMwAAAPOPemkAAAM1SURBVHjaYmBgYGBkYQUBFkYWFiCPCchixQAMCCZAACF0MAMVM4K4TFh0IGsBCCAkOxhYmBnAAKaHhZkZmxaAAGJgYIbpYGBihGgBWsTMzMwE4jIhaWGAYoAAYmCECDExYAcwGxkg5oNIgABigDqLARdgZmGB2wICrKwAAcSA3xKgIxlZ0PwCEEAMBCxhgHoWSQtAADFAAxgfYEJ1GEAAQbQw4tUCsocBYQVAADEgu4uRkREeUCwszEwwLhOKLQABhNDCBA4aSDgwwhIAJKqYUPwCEEAMUK/AUwnc9aywJMCI7DAgAAggBohZ8JTBhGIJzCoWZL8ABBCYidAB8RUjWppkYUG2BSCAGMDqEMZiswUtXgACiAHsFYixTMywGGLGpgUWYgABxAA2mQkWCMyMqFoYmdD8ACQAAogBHJHMrCxg1cyIiICmCkYWDFsAAgiihYmZCewFFpR0BfI3LLch+QUggBiQ0iQjEyMDmh54qCBlUIAAYsCRJsElADQvgWKTlRGeKwECiAF3XgGmMEYQYADZzcoA9z5AAMG9RQCAtEC9DxBADFiyFyMjVi0wABBAWLQwQdIiuhYGWJIACCBg+KKUJ9BoBRdS2LQALQMIIGDQIEmwAO1kYcVWHCDZAhBAqFqYmOAxj2YNtAwDAYAAYmDEiBYWzHKKkRERYiwAAYSphZEZwxZGZiZQVEJTJkAAMTCyokc7M5oORlC5wcoEjxeAAAJqQXU0UB6W5WFmABMtEzM
i1wEEEFAbE0YyAUuzMMEsYQalMkQSBQggUDmNPU3C9IA4LCxI+QUggEBiKOU8yExgqccCL3chnkPKlQABhGo6ejHBDKmdUHMlQAAhhQvQaGZGkBIkjcAMywLmI+VKgABCSowsTJhZkhlWXiBpAQggYBqBZl9GVOdBcz0LZqEEEEAMqLULMBLg1THWog9IAwQQA0qiZcRW5aPbAhBADCg1El4tMAAQQAxoiZYZXnTh1AIQQAzo2QlYpDDjcBgrxGEAAcSAJTthswmiBUwDBBC2GpkZJTaRvQ+mAQKIAUuuxdZWQvILQABBmSxMjBj5EpcWgACCMoFOYYSpZyHQHgMIMACt2hmoVEikCQAAAABJRU5ErkJggg=="></object>
</p>
</body>
</html>
\ No newline at end of file