You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2023/08/23 13:50:50 UTC
[tika] branch main updated: rat plugin fixes in prep for 2.9.0-rc1
This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/main by this push:
new f285d4f0f rat plugin fixes in prep for 2.9.0-rc1
f285d4f0f is described below
commit f285d4f0f2f9439ed9807339164ae7b846c380b2
Author: tallison <ta...@apache.org>
AuthorDate: Wed Aug 23 09:50:34 2023 -0400
rat plugin fixes in prep for 2.9.0-rc1
---
.../resources/test-documents/undeclared_entity.xml | 18 ++++++++++++++++++
.../tika-parsers-ml/tika-age-recogniser/pom.xml | 1 +
.../tika-parsers-ml/tika-parser-nlp-module/pom.xml | 14 ++++++++++++++
.../src/test/resources/test-documents/testTEI.xml | 16 ++++++++++++++++
.../tika-parser-image-module/pom.xml | 9 +++++++++
5 files changed, 58 insertions(+)
diff --git a/tika-core/src/test/resources/test-documents/undeclared_entity.xml b/tika-core/src/test/resources/test-documents/undeclared_entity.xml
index 9996842c8..d389f40ba 100644
--- a/tika-core/src/test/resources/test-documents/undeclared_entity.xml
+++ b/tika-core/src/test/resources/test-documents/undeclared_entity.xml
@@ -1,4 +1,22 @@
<?xml version="1.0" encoding="UTF-8" ?>
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one
+ or more contributor license agreements. See the NOTICE file
+ distributed with this work for additional information
+ regarding copyright ownership. The ASF licenses this file
+ to you under the Apache License, Version 2.0 (the
+ "License"); you may not use this file except in compliance
+ with the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing,
+ software distributed under the License is distributed on an
+ "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ KIND, either express or implied. See the License for the
+ specific language governing permissions and limitations
+ under the License.
+-->
<address>
<company>START</company>
<name>An entity here&undeclared_entity; is invalid!</name>
diff --git a/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml b/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
index 5c8a7e876..2ba7e2a31 100644
--- a/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
+++ b/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
@@ -203,6 +203,7 @@
<version>${rat.version}</version>
<configuration>
<excludes>
+ <exclude>model/opennlp/*.bin</exclude>
<exclude>model/org/apache/tika/parser/recognition/**</exclude>
</excludes>
</configuration>
diff --git a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
index 2b93cc390..f6065e3c1 100644
--- a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
+++ b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
@@ -146,6 +146,20 @@
</dependency>
</dependencies>
+ <build>
+ <plugins>
+ <plugin>
+ <groupId>org.apache.rat</groupId>
+ <artifactId>apache-rat-plugin</artifactId>
+ <version>${rat.version}</version>
+ <configuration>
+ <excludes>
+ <exclude>src/test/resources/org/apache/tika/parser/ner/opennlp/*.bin</exclude>
+ </excludes>
+ </configuration>
+ </plugin>
+ </plugins>
+ </build>
<profiles>
<profile>
<id>testSetup</id>
diff --git a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
index dcba59655..dc610319c 100644
--- a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
+++ b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
@@ -1,3 +1,19 @@
+<!--
+ Licensed to the Apache Software Foundation (ASF) under one or more
+ contributor license agreements. See the NOTICE file distributed with
+ this work for additional information regarding copyright ownership.
+ The ASF licenses this file to You under the Apache License, Version 2.0
+ (the "License"); you may not use this file except in compliance with
+ the License. You may obtain a copy of the License at
+
+ http://www.apache.org/licenses/LICENSE-2.0
+
+ Unless required by applicable law or agreed to in writing, software
+ distributed under the License is distributed on an "AS IS" BASIS,
+ WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ See the License for the specific language governing permissions and
+ limitations under the License.
+-->
<TEI xmlns="http://www.tei-c.org/ns/1.0"
xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
xsi:schemaLocation="http://www.tei-c.org/ns/1.0 C:\grobid\grobid-home/schemas/xsd/Grobid.xsd"
diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
index 99c7f3256..6f12dbaa0 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
@@ -90,6 +90,15 @@
</execution>
</executions>
</plugin>
+ <plugin>
+ <groupId>org.apache.rat</groupId>
+ <artifactId>apache-rat-plugin</artifactId>
+ <configuration>
+ <excludes>
+ <exclude>src/main/resources/**/properties</exclude>
+ </excludes>
+ </configuration>
+ </plugin>
</plugins>
</build>