You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by ta...@apache.org on 2023/08/23 13:50:50 UTC

[tika] branch main updated: rat plugin fixes in prep for 2.9.0-rc1

This is an automated email from the ASF dual-hosted git repository.

tallison pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/tika.git


The following commit(s) were added to refs/heads/main by this push:
     new f285d4f0f rat plugin fixes in prep for 2.9.0-rc1
f285d4f0f is described below

commit f285d4f0f2f9439ed9807339164ae7b846c380b2
Author: tallison <ta...@apache.org>
AuthorDate: Wed Aug 23 09:50:34 2023 -0400

    rat plugin fixes in prep for 2.9.0-rc1
---
 .../resources/test-documents/undeclared_entity.xml     | 18 ++++++++++++++++++
 .../tika-parsers-ml/tika-age-recogniser/pom.xml        |  1 +
 .../tika-parsers-ml/tika-parser-nlp-module/pom.xml     | 14 ++++++++++++++
 .../src/test/resources/test-documents/testTEI.xml      | 16 ++++++++++++++++
 .../tika-parser-image-module/pom.xml                   |  9 +++++++++
 5 files changed, 58 insertions(+)

diff --git a/tika-core/src/test/resources/test-documents/undeclared_entity.xml b/tika-core/src/test/resources/test-documents/undeclared_entity.xml
index 9996842c8..d389f40ba 100644
--- a/tika-core/src/test/resources/test-documents/undeclared_entity.xml
+++ b/tika-core/src/test/resources/test-documents/undeclared_entity.xml
@@ -1,4 +1,22 @@
 <?xml version="1.0" encoding="UTF-8" ?>
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one
+  or more contributor license agreements.  See the NOTICE file
+  distributed with this work for additional information
+  regarding copyright ownership.  The ASF licenses this file
+  to you under the Apache License, Version 2.0 (the
+  "License"); you may not use this file except in compliance
+  with the License.  You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing,
+  software distributed under the License is distributed on an
+  "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+  KIND, either express or implied.  See the License for the
+  specific language governing permissions and limitations
+  under the License.
+-->
 <address>
    <company>START</company>
    <name>An entity here&undeclared_entity; is invalid!</name>
diff --git a/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml b/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
index 5c8a7e876..2ba7e2a31 100644
--- a/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
+++ b/tika-parsers/tika-parsers-ml/tika-age-recogniser/pom.xml
@@ -203,6 +203,7 @@
         <version>${rat.version}</version>
         <configuration>
           <excludes>
+            <exclude>model/opennlp/*.bin</exclude>
             <exclude>model/org/apache/tika/parser/recognition/**</exclude>
           </excludes>
         </configuration>
diff --git a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
index 2b93cc390..f6065e3c1 100644
--- a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
+++ b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/pom.xml
@@ -146,6 +146,20 @@
         </dependency>
     </dependencies>
 
+    <build>
+        <plugins>
+            <plugin>
+                <groupId>org.apache.rat</groupId>
+                <artifactId>apache-rat-plugin</artifactId>
+                <version>${rat.version}</version>
+                <configuration>
+                    <excludes>
+                        <exclude>src/test/resources/org/apache/tika/parser/ner/opennlp/*.bin</exclude>
+                    </excludes>
+                </configuration>
+            </plugin>
+        </plugins>
+    </build>
     <profiles>
         <profile>
             <id>testSetup</id>
diff --git a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
index dcba59655..dc610319c 100644
--- a/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
+++ b/tika-parsers/tika-parsers-ml/tika-parser-nlp-module/src/test/resources/test-documents/testTEI.xml
@@ -1,3 +1,19 @@
+<!--
+  Licensed to the Apache Software Foundation (ASF) under one or more
+  contributor license agreements.  See the NOTICE file distributed with
+  this work for additional information regarding copyright ownership.
+  The ASF licenses this file to You under the Apache License, Version 2.0
+  (the "License"); you may not use this file except in compliance with
+  the License.  You may obtain a copy of the License at
+
+  http://www.apache.org/licenses/LICENSE-2.0
+
+  Unless required by applicable law or agreed to in writing, software
+  distributed under the License is distributed on an "AS IS" BASIS,
+  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+  See the License for the specific language governing permissions and
+  limitations under the License.
+-->
 <TEI xmlns="http://www.tei-c.org/ns/1.0"
      xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
      xsi:schemaLocation="http://www.tei-c.org/ns/1.0 C:\grobid\grobid-home/schemas/xsd/Grobid.xsd"
diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
index 99c7f3256..6f12dbaa0 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-image-module/pom.xml
@@ -90,6 +90,15 @@
           </execution>
         </executions>
       </plugin>
+      <plugin>
+        <groupId>org.apache.rat</groupId>
+        <artifactId>apache-rat-plugin</artifactId>
+        <configuration>
+          <excludes>
+            <exclude>src/main/resources/**/properties</exclude>
+          </excludes>
+        </configuration>
+      </plugin>
     </plugins>
   </build>