You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@tika.apache.org by gi...@apache.org on 2022/05/21 17:08:31 UTC
[tika] branch dependabot/maven/org.glassfish.jaxb-jaxb-runtime-3.0.2 updated (0755c0957 -> 1888b1489)
This is an automated email from the ASF dual-hosted git repository.
github-bot pushed a change to branch dependabot/maven/org.glassfish.jaxb-jaxb-runtime-3.0.2
in repository https://gitbox.apache.org/repos/asf/tika.git
discard 0755c0957 Bump jaxb-runtime from 2.3.6 to 3.0.2
add c133e09fb Bump avro from 1.10.2 to 1.11.0 (#533)
add 6b81c564f Bump plexus-utils from 2.0.5 to 3.4.1 (#523)
add c93bac0cc TIKA-3675 general upgrades for 2.4.0
add 000abdcf7 TIKA-3695 (#534)
add 2da9c5d18 Bump jackrabbit.version from 2.21.9 to 2.21.10 (#535)
add de1835b75 TIKA-3675 - general upgrades for 2.4.0
add 0be171352 TIKA-3697 : add initial warc and wacz parsers
add 1260c0203 Merge remote-tracking branch 'origin/main' into main
add 0ceabfa14 Change metadata write limit to "warn" instead of "exception"
add 1d5f5afd0 Bump minor version...lots of changes since 2.3.0.
add 68fe7ff3f TIKA-3699 - Upgrade POI to 5.2.2.
add bdfd653d4 TIKA-3675 -- general upgrades for 2.4.0
add b2e18d388 TIKA-3695 -- further refactorings to add limits on key sizes and per field limits.
add 77ab34b17 Bump cxf.version from 3.5.0 to 3.5.1 (#537)
add 2a0f51ef0 TIKA-3695 -- fix serialization in tika-bundle forkparser test
add 9952019a5 TIKA-3695 -- add a minmax limit for the always add and always set fields. Add a max values per field setting.
add fbeab6c3f TIKA-3707 -- add fetcher and emitter for Azure blob storage
add 294539352 TIKA-3707 -- add fetcher and emitter for Azure blob storage -- add pipes iterator and clean up some other stuff.
add d6aa60f16 TIKA-3707 -- bump azure-storage-blob version
add f968b9dfb TIKA-3707 -- allow sending in the full sasurl per blob
add d3a4d6a7e TIKA-3675 -- bump jackson databind version and clean up jackson dependency mgmt.
add b14b4b1cd TIKA-3675 -- various other updates
add 950f3d9fa TIKA-3675 -- revert mistaken pdfbox snapshot commit
add 39adeeb2f Improve reporting organization in maven 3.5.x
add 4f3f88baf Bump versions-maven-plugin from 2.9.0 to 2.10.0 (#540)
add 1b33d7c87 Bump scala-reflect from 2.12.12 to 2.13.8 (#538)
add fd9cb684c update CHANGES.txt to include new /eval endpoint
add 283aa339b Merge remote-tracking branch 'origin/main' into main
add bd157e5b2 TIKA-3675
add 4fad47072 TIKA-3716 -- add a Parsed-By-Full-Set metadata key to record all parsers that touched a file.
add 984ce0e77 TIKA-3714 -- allow specification of fetchername and fetchkey in url parameters in tika-server
add ad29e809d TIKA-3715 -- push forking processes' env variables into forked process.
add 4e8a750c0 Update DetectorResource.java (#543)
add 031c9d16c Merge remote-tracking branch 'origin/main' into main
add fc896a45d fix checkstyle
add fa6c4baac TIKA-3717 -- add metadata filters for optimaize and opennlp lang detectors
add aa227bca7 TIKA-3675 -- general dependency upgrades for 2.4.0
add ccc7bd841 TIKA-3711 -- allow configuration of EmbeddedDocumentExtractors via tika-config.xml
add 6552b076f TIKA-3711 -- allow configuration of EmbeddedDocumentExtractors via tika-config.xml -- review and correct places where outputHtml should be false.
add 951ede5ce Bump jetty.version from 9.4.45.v20220203 to 9.4.46.v20220331 (#541)
add fa3389fe6 Bump maven-surefire-plugin from 3.0.0-M5 to 3.0.0-M6 (#544)
add 6e7bb2dfe Bump azure-storage-blob from 12.15.0 to 12.16.0 (#545)
add fe49555d8 Bump aws.version from 1.12.195 to 1.12.197 (#546)
add fb56aab33 Bump aws.version from 1.12.197 to 1.12.200 (#547)
add 23be41144 Bump FastInfoset from 2.0.0 to 2.1.0 (#548)
add 62af5295a TIKA-3666 -- add detection for files protected by Microsoft's Rights Management Service (RMS).
add 83b0de4d6 general code improvements
add d8113db2b TIKA-3666 -- add encrypted document exception if we haven't identified the file type and there is an EncryptedPackage.
add 7232fd4a0 TIKA-3723 -- Allow configurability of the ContentHandlerDecorator used by the AutoDetectParser.
add 9f204bfad TIKA-3724
add 4b20970cb TIKA-3724 - refactor AES initialization
add fc19baf5f Merge remote-tracking branch 'origin/main' into main
add 5386d61d5 TIKA-3726 -- upgrade PDFBox to 2.0.26
add cee0f15df TIKA-3721 -- add detection of dgn files via Steven Frew's tika-dgn-detector
add c1c69dac4 TIKA-3719 (#549)
add 00c2614b1 TIKA-3719 -- fix tests on Windows
add 0f7d9263d TIKA-3719 -- fix tests on Windows
add 742af7025 fix older, long broken tests on Windows
add 5b90009e7 fix assertion on error msg in two way tls test
add b8669229f TIKA-3719 -- log warning about beta stage of tls configuration
add c06968473 further attempts to fix windows build
add 4639e8d37 TIKA-3730
add 90c7e4c2d TIKA-3730 -- fix checkstyle; hang head in shame.
add 10a87151b general upgrades for 2.x
add 15909b432 TIKA-3733 -- pass parent metadata to AbstractPOIFSExtractor in OutlookExtractor
add 43d0434b8 TIKA-3734 -- avoid illegalargumentexception with zero byte streams
add 079db8d82 TIKA-3731 -- expand metadata extraction for DWG AC1027 and AC1032; add prefix for custom metadata
add 1d469867e TIKA-3721 -- add DGN8Parser for metadata via Dan Coldrick
add 8ff887fc2 TIKA-3721 -- add DGN8Parser for metadata via Dan Coldrick -- put unit test in correct package.
add 1e0a544fd TIKA-3675 -- general upgrades for 2.4.0
add fc05adb88 TIKA-3741 -- fix regression in handling embedded file exceptions in ppt
add 9fc04189c add branch_1x to github actions
add 403b7aef2 TIKA-3740 -- upgrade junrar
add f33d8930e PDP-11 style "Middle Endian" 32 bit read util, as used in the DGN file format
add bbd8eddba Merge remote-tracking branch 'origin/main' into main
add 3b322e96e fix workflow names for branch_1x
add 7d3911ece TIKA-3743 -- install
add d189d7bdb Update CHANGES.txt for X.Y.Z release.
add 3677bf669 [maven-release-plugin] prepare release 2.4.0-rc1
add 6e9d5c00d [maven-release-plugin] prepare for next development iteration
add c14de4f1a Merge remote-tracking branch 'origin/main' into main
add fad145d41 need to switch tasks -> target for major release upgrade for antrun
add 8faf9ae76 roll back version for second attempt at 2.4.0-rc1
add ac10b61ab TIKA-3745 -- turn off file names appearing in the streams for thumbnails and embedded images in odt.
add 740f70bb3 [maven-release-plugin] prepare release 2.4.0-rc1
add 8cf53d73a [maven-release-plugin] prepare for next development iteration
add 6fb5bb03c Merge remote-tracking branch 'origin/main' into main
add faa2f47e8 remove branch_1x workflows from main branch
add 8a56a9ad6 add branch_1x workflows back to main branch
add 33aa848cf TIKA-3748 -- allow expansion of system properties into forked process system properties.
add a02c195d1 Add an interface for rendering engines (#555)
add 8aef179f4 convert dev println into actual unit test...sorry.
add c8861d269 TIKA-3748 -- escape replacements correctly
add b9efda88a [TIKA-3749] upgrade maven-bundle-plugin (#556)
add cfa9a5274 TIKA-3750 -- add unit test
add 121fe480f TIKA-3750 -- add license header to pom.xml
add 6fb369308 fix typo in variable names
add 42da02ef1 TIKA-3750 - Fixed bug in ordering of Parsers during service loading.
add 91d389f06 add more debug logging to ExternalParser
add ba9fdc1b5 Merge remote-tracking branch 'origin/main' into main
add 99dc4885d add VectorGraphicsOnlyPDFRenderer
add dcec488a2 TIKA-3751 -- general upgrades for 2.4.1
add 43996149b back off to test in github actions
add b4c1c033f TIKA-3571 -- rollback puppycrawl -- requires java > 8
add 32a9c4d92 ci/cd still failing, try adding package?
add 6e83ee7f8 TIKA-3743 -- test rolling back bundle-plugin to see if github actions work
add 7424dace7 fix branch_1x workflow
add 1b9f0d9d9 TIKA-3751: update site plugin
add 2f703f9e1 TIKA-3751: update build plugins
add 0a6475d79 TIKA-3751: update plugins, remove option not supported in jdk8
add 54c51cd00 TIKA-3751: revert maven.bundle.version to 5.1.4 due to build failures
add 0ee049f52 TIKA-3751: update netty
add 678898a9d TIKA-3571 -- cleanup
add 7d8ade1a0 TIKA-3572 -- fix duplicate logic branch in MidiParser
add 07a59ecd6 TIKA-3754 -- allow customization of ImageGraphicsEngine
add 87a3468fc TIKA-3754 -- allow easier customization of ImageGraphicsEngine
add 974506272 TIKA-3754 -- allow easier customization of ImageGraphicsEngine, add page number
add c3b489ab5 remove dodgy testStandardsExtractor.pdf
add f92dc3f9b TIKA-3751: update spring, improve comment
add e2a6d2513 Merge origin/main into main
add 8876fdf62 Merge remote-tracking branch 'origin/main' into main
add bf2d904e9 add resource loading tests back(?)
add 62de2a3ff fix MyCustomImageGraphicsEngineFactory
add 8ce439ce1 TIKA-3755 -- make renderresult more flexible to allow for an open container or an inputstream; add image strategy end of page
add 1dda56bd8 Bump netty-tcnative-classes from 2.0.51.Final to 2.0.52.Final
add 7b79e0b6e Merge remote-tracking branch 'origin/main' into main
add adf8dacf7 TIKA-3756
add d86eb703b TIKA-3760 -- migrate to junit5 in tika-eval
add de04c1cdd TIKA-3757 - migrate to junit5 in tika-translate
add 27b4273d0 TIKA-3761 - migrate to junit5 in tika-example
add 5bfdf933e migrate to junit5 in tika-java7
add 574e4defc TIKA-3758 -- upgrade to junit5 in tika-app
add 6bd1bd939 TIKA-3762 -- upgrade to junit5 in tika-xmp
add 6c1ec133f TIKA-3759 -- upgrade to junit5 in tika-batch
add 71c9f9f20 upgrade to junit5 in tika-fuzzing
add 84582534c upgrade to junit5 in tika-bundles
add f4a2960ed fix checkstyle
add ba631c095 TIKA-1570 -- add a stop method to TikaServerCli
add ca35eb2ae fix bad import
add 39d3ed513 TIKA-3755 -- bug fix need to add renderer to userConfigured set
add 98cd7e650 TIKA-3759 -- fix unit test that fails on windows.
add 359ed9097 Bump aws.version from 1.12.214 to 1.12.220
add 3f9e7a3c5 TIKA-3763 -- make sure to close the ForkParser in TikaCLI and elsewhere.
add acfa13465 TIKA-3764 -- add unit tests for Solr 9
add 46d148fdc TIKA-3767 -- switch to @TempDir in TikaCLITest
add d67d69251 TIKA-3766: delete temporary directories, simplify temp directory generation
add 3fa217103 TIKA-3766: delete temporary directories immediately, rename variable
add 79781050f Merge remote-tracking branch 'origin/main' into main
add 14784c59d TIKA-3767 -- fix whitespace
add 750690297 TIKA-3769 -- improve marc mime detection
add d6c34c919 TIKA-3767 -- use @TempDir more often to simplify unit tests
add c212e0ad3 Bump azure-storage-blob from 12.16.0 to 12.16.1
add 4f8134da9 Merge remote-tracking branch 'origin/main' into main
add 14ca42d62 TIKA-3751: update maven-bundle-plugin
add 58a446bd2 Bump zstd-jni from 1.5.2-2 to 1.5.2-3
add 23a4d6942 Merge origin/dependabot/maven/com.github.luben-zstd-jni-1.5.2-3 into main
add 4122a8c88 Bump aws.version from 1.12.220 to 1.12.222
add 206a1eb5d Merge origin/dependabot/maven/aws.version-1.12.222 into main
add 4982e389b Bump jackson.version from 2.13.2 to 2.13.3 (#564)
add 38f8e1a54 Bump aws.version from 1.12.222 to 1.12.223
add 9f63c2966 TIKA-3751: add comment why we can't update
add 394746b71 TIKA-3751: update jackson-databind
add df5c784f0 Bump groovy-all from 2.4.9 to 2.4.21
add bb48354b5 Merge pull request #569 from apache/dependabot/maven/org.codehaus.groovy-groovy-all-2.4.21
add d470644e3 Bump aws.version from 1.12.223 to 1.12.224
add 67796d2e7 Merge pull request #570 from apache/dependabot/maven/aws.version-1.12.224
add c2f714e5f TIKA-3751: update plexus-utils
add f23d7bf93 TIKA-3751: update testcontainers
add 3e515e072 TIKA-3751: update org.osgi.compendium
add 481adfca7 TIKA-3751: update junit5; use variable for osgi compendium version
add 2dbcea768 TIKA-3751: add comment about failure to update jaxb
add 61b70a117 TIKA-3751: add comment about why test could fail
add 1888b1489 Bump jaxb-runtime from 2.3.6 to 3.0.2
This update added new revisions after undoing existing revisions.
That is to say, some revisions that were in the old version of the
branch are not in the new version. This situation occurs
when a user --force pushes a change and generates a repository
containing something like this:
 * -- * -- B -- O -- O -- O   (0755c0957)
            \
             N -- N -- N   refs/heads/dependabot/maven/org.glassfish.jaxb-jaxb-runtime-3.0.2 (1888b1489)
You should already have received notification emails for all of the O
revisions, and so the following emails describe only the N revisions
from the common base, B.
Any revisions marked "omit" are not gone; other references still
refer to them. Any revisions marked "discard" are gone forever.
No new revisions were added by this update.
Summary of changes:
.../workflows/branch_1x-jdk11-build.yml | 32 +-
...in-jdk11-build.yml => branch_1x-jdk8-build.yml} | 8 +-
.github/workflows/main-jdk11-build.yml | 2 +-
.github/workflows/main-jdk17-build.yml | 2 +-
.github/workflows/main-jdk8-build.yml | 2 +-
CHANGES.txt | 59 ++-
pom.xml | 6 +-
tika-app/pom.xml | 9 +-
.../src/main/java/org/apache/tika/cli/TikaCLI.java | 23 +-
.../tika/cli/TikaCLIBatchCommandLineTest.java | 18 +-
.../tika/cli/TikaCLIBatchIntegrationTest.java | 21 +-
.../test/java/org/apache/tika/cli/TikaCLITest.java | 157 +++----
.../tika/extractor/TestEmbeddedDocumentUtil.java | 6 +-
tika-batch/pom.xml | 9 +-
.../tika/batch/CommandLineParserBuilderTest.java | 2 +-
.../RecursiveParserWrapperFSConsumerTest.java | 4 +-
.../org/apache/tika/batch/fs/BatchDriverTest.java | 61 +--
.../org/apache/tika/batch/fs/BatchProcessTest.java | 61 +--
.../org/apache/tika/batch/fs/FSBatchTestBase.java | 33 +-
.../apache/tika/batch/fs/FSFileResourceTest.java | 6 +-
.../java/org/apache/tika/batch/fs/FSUtilTest.java | 20 +-
.../apache/tika/batch/fs/HandlerBuilderTest.java | 6 +-
.../tika/batch/fs/OutputStreamFactoryTest.java | 8 +-
.../tika/batch/fs/strawman/StrawmanTest.java | 2 +-
tika-bom/pom.xml | 128 +++---
tika-bundles/pom.xml | 15 +-
tika-bundles/tika-bundle-standard/pom.xml | 7 +-
.../test/java/org/apache/tika/bundle/BundleIT.java | 32 +-
tika-core/pom.xml | 7 +-
.../java/org/apache/tika/config/TikaConfig.java | 139 ++++++-
.../EmbeddedDocumentExtractorFactory.java | 13 +-
.../tika/extractor/EmbeddedDocumentUtil.java | 28 +-
.../ParsingEmbeddedDocumentExtractor.java | 8 +-
.../ParsingEmbeddedDocumentExtractorFactory.java | 28 +-
.../main/java/org/apache/tika/io/EndianUtils.java | 19 +
.../java/org/apache/tika/metadata/Metadata.java | 104 ++++-
.../java/org/apache/tika/metadata/PagedText.java | 2 +
.../java/org/apache/tika/metadata/Rendering.java | 16 +-
.../apache/tika/metadata/TikaCoreProperties.java | 35 +-
.../{PagedText.java => TikaPagedText.java} | 21 +-
.../main/java/org/apache/tika/metadata/WARC.java | 23 +-
.../metadata/filter/DefaultMetadataFilter.java | 6 +-
.../metadata/writefilter/MetadataWriteFilter.java | 52 +++
.../writefilter/MetadataWriteFilterFactory.java | 14 +-
.../metadata/writefilter/StandardWriteFilter.java | 458 +++++++++++++++++++++
.../writefilter/StandardWriteFilterFactory.java | 118 ++++++
.../org/apache/tika/parser/AutoDetectParser.java | 33 +-
.../apache/tika/parser/AutoDetectParserConfig.java | 52 ++-
.../org/apache/tika/parser/CompositeParser.java | 39 +-
.../java/org/apache/tika/parser/DefaultParser.java | 37 +-
.../org/apache/tika/parser/RenderingParser.java | 13 +-
.../tika/parser/external/ExternalParser.java | 3 +
.../tika/parser/external2/ExternalParser.java | 15 +-
.../apache/tika/renderer/CompositeRenderer.java | 102 +++++
.../tika/renderer/PageBasedRenderResults.java | 50 +++
.../org/apache/tika/renderer/PageRangeRequest.java | 60 +++
.../org/apache/tika/renderer/RenderRequest.java | 21 +-
.../org/apache/tika/renderer/RenderResult.java | 92 +++++
.../org/apache/tika/renderer/RenderResults.java | 35 +-
.../java/org/apache/tika/renderer/Renderer.java | 62 +++
.../org/apache/tika/renderer/RenderingState.java | 17 +-
.../org/apache/tika/renderer/RenderingTracker.java | 26 +-
.../tika/sax/ContentHandlerDecoratorFactory.java | 13 +-
.../java/org/apache/tika/sax/StandardsText.java | 2 +-
.../java/org/apache/tika/utils/ParserUtils.java | 15 +-
.../org/apache/tika/mime/tika-mimetypes.xml | 61 ++-
.../org/apache/tika/TestRereadableInputStream.java | 25 +-
.../org/apache/tika/config/TikaConfigTest.java | 1 -
.../java/org/apache/tika/fork/ForkParserTest.java | 56 +--
.../apache/tika/fork/ForkParserTikaBinTest.java | 13 +-
.../java/org/apache/tika/io/EndianUtilsTest.java | 18 +
.../org/apache/tika/io/TikaInputStreamTest.java | 7 +-
.../writefilter/StandardWriteFilterTest.java | 230 +++++++++++
.../tika/pipes/async/AsyncProcessorTest.java | 17 +-
.../org/apache/tika/config/TIKA-3695-fields.xml | 40 ++
.../resources/org/apache/tika/config/TIKA-3695.xml | 33 ++
tika-eval/pom.xml | 11 +-
tika-eval/tika-eval-app/pom.xml | 2 +-
.../apache/tika/eval/app/AnalyzerManagerTest.java | 10 +-
.../apache/tika/eval/app/ComparerBatchTest.java | 25 +-
.../apache/tika/eval/app/ProfilerBatchTest.java | 36 +-
.../apache/tika/eval/app/SimpleComparerTest.java | 24 +-
.../org/apache/tika/eval/app/TikaEvalCLITest.java | 34 +-
.../tika/eval/app/db/AbstractBufferTest.java | 9 +-
.../apache/tika/eval/app/io/ExtractReaderTest.java | 8 +-
.../tika/eval/app/io/FatalExceptionReaderTest.java | 2 +-
.../tika/eval/app/reports/ResultsReporterTest.java | 10 +-
.../eval/app/tools/TopCommonTokenCounterTest.java | 18 +-
tika-eval/tika-eval-core/pom.xml | 3 +-
.../apache/tika/eval/core/langid/LangIdTest.java | 8 +-
.../core/metadata/TikaEvalMetadataFilterTest.java | 4 +-
.../tika/eval/core/textstats/TextStatsTest.java | 4 +-
.../tika/eval/core/tokens/TokenCounterTest.java | 11 +-
.../apache/tika/eval/core/util/LanguageIdTest.java | 11 +-
.../apache/tika/eval/core/util/MimeUtilTest.java | 12 +-
tika-example/pom.xml | 11 +-
.../tika/example/AdvancedTypeDetectorTest.java | 5 +-
.../tika/example/ContentHandlerExampleTest.java | 15 +-
.../tika/example/DumpTikaConfigExampleTest.java | 24 +-
.../tika/example/ExtractEmbeddedFilesTest.java | 12 +-
.../tika/example/LanguageDetectorExampleTest.java | 8 +-
.../tika/example/SimpleTextExtractorTest.java | 2 +-
.../tika/example/SimpleTypeDetectorTest.java | 2 +-
.../apache/tika/example/TestParsingExample.java | 37 +-
.../tika/example/TextStatsFromTikaEvalTest.java | 4 +-
.../apache/tika/example/TranslatorExampleTest.java | 8 +-
tika-fuzzing/pom.xml | 9 +-
tika-fuzzing/src/test/java/TestFuzzingCLI.java | 8 +-
tika-fuzzing/src/test/java/TestTransformer.java | 6 +-
tika-integration-tests/pom.xml | 3 +-
.../pom.xml | 2 +-
.../opensearch/tests/TikaPipesOpenSearchTest.java | 2 +-
.../tika-pipes-s3-integration-tests/pom.xml | 2 +-
.../tika-pipes-solr-integration-tests/pom.xml | 2 +-
.../tika/pipes/solr/tests/TikaPipesSolr8Test.java | 2 +-
...PipesSolr8Test.java => TikaPipesSolr9Test.java} | 4 +-
...pesSolr8Test.java => TikaPipesSolr9ZkTest.java} | 21 +-
.../pipes/solr/tests/TikaPipesSolrTestBase.java | 18 +
.../tika-resource-loading-tests}/pom.xml | 31 +-
.../org/apache/custom/parser/CustomParserTest.java | 31 +-
.../org/apache/custom/parser/MyCustomParser.java | 51 +++
.../services/org.apache.tika.parser.Parser | 5 +-
tika-java7/pom.xml | 9 +-
.../filetypedetector/TikaFileTypeDetectorTest.java | 26 +-
tika-langdetect/pom.xml | 14 +-
tika-langdetect/tika-langdetect-lingo24/pom.xml | 3 +-
.../lingo24/Lingo24LangDetectorTest.java | 10 +-
tika-langdetect/tika-langdetect-mitll-text/pom.xml | 3 +-
.../langdetect/mitll/TextLangDetectorTest.java | 8 +-
tika-langdetect/tika-langdetect-opennlp/pom.xml | 2 +-
.../metadatafilter/OpenNLPMetadataFilter.java | 49 +++
.../langdetect/opennlp/OpenNLPDetectorTest.java | 8 +-
tika-langdetect/tika-langdetect-optimaize/pom.xml | 2 +-
.../optimaize/OptimaizeLangDetector.java | 13 +-
.../metadatafilter/OptimaizeMetadataFilter.java | 49 +++
.../optimaize/OptimaizeLangDetectorTest.java | 31 +-
.../tika-langdetect-test-commons/pom.xml | 2 +-
tika-langdetect/tika-langdetect-tika/pom.xml | 2 +-
.../langdetect/tika/LanguageIdentifierTest.java | 18 +-
.../tika/langdetect/tika/LanguageProfileTest.java | 6 +-
.../tika/LanguageProfilerBuilderTest.java | 16 +-
.../tika/langdetect/tika/ProfilingWriterTest.java | 4 +-
tika-parent/pom.xml | 106 +++--
tika-parsers/pom.xml | 2 +-
tika-parsers/tika-parsers-extended/pom.xml | 2 +-
.../tika-parser-scientific-module/pom.xml | 2 +-
.../tika-parser-scientific-package/pom.xml | 2 +-
.../tika-parser-sqlite3-module/pom.xml | 2 +-
.../tika-parser-sqlite3-package/pom.xml | 2 +-
.../pom.xml | 2 +-
tika-parsers/tika-parsers-ml/pom.xml | 2 +-
.../tika-parsers-ml/tika-age-recogniser/pom.xml | 6 +-
tika-parsers/tika-parsers-ml/tika-dl/pom.xml | 2 +-
.../tika-parser-advancedmedia-module/pom.xml | 2 +-
.../tika-parser-advancedmedia-package/pom.xml | 9 +-
.../tika-parsers-ml/tika-parser-nlp-module/pom.xml | 4 +-
.../tika-parser-nlp-package/pom.xml | 9 +-
.../tika-parsers-ml/tika-transcribe-aws/pom.xml | 4 +-
tika-parsers/tika-parsers-standard/pom.xml | 2 +-
.../tika-parsers-standard-modules/pom.xml | 3 +-
.../tika-parser-apple-module/pom.xml | 2 +-
.../tika-parser-audiovideo-module/pom.xml | 2 +-
.../org/apache/tika/parser/audio/MidiParser.java | 2 -
.../apache/tika/parser/mp4/TikaMp4BoxHandler.java | 16 +-
.../tika/parser/mp4/boxes/TikaUserDataBox.java | 6 +-
.../tika-parser-cad-module/pom.xml | 8 +-
.../org/apache/tika/parser/dgn/DGN8Parser.java | 88 ++++
.../java/org/apache/tika/parser/dwg/DWGParser.java | 10 +-
.../services/org.apache.tika.parser.Parser | 1 +
.../apache/tika/parser/dgn/DGN8ParserTest.java} | 33 +-
.../org/apache/tika/parser/dwg/DWGParserTest.java | 25 +-
.../src/test/resources/test-documents/testDGN7.dgn | Bin 0 -> 33792 bytes
.../src/test/resources/test-documents/testDGN8.dgn | Bin 0 -> 28160 bytes
.../resources/test-documents/testDWG-AC1027.dwg | Bin 0 -> 265260 bytes
.../resources/test-documents/testDWG-AC1032.dwg | Bin 0 -> 158593 bytes
.../tika-parser-code-module/pom.xml | 2 +-
.../tika-parser-crypto-module/pom.xml | 2 +-
.../tika-parser-digest-commons/pom.xml | 2 +-
.../tika-parser-font-module/pom.xml | 2 +-
.../tika-parser-html-commons/pom.xml | 2 +-
.../tika-parser-html-module/pom.xml | 2 +-
.../tika-parser-image-module/pom.xml | 2 +-
.../tika-parser-jdbc-commons/pom.xml | 2 +-
.../tika-parser-mail-commons/pom.xml | 2 +-
.../tika-parser-mail-module/pom.xml | 2 +-
.../tika-parser-microsoft-module/pom.xml | 2 +-
.../detect/microsoft/POIFSContainerDetector.java | 71 +++-
.../parser/microsoft/AbstractPOIFSExtractor.java | 33 +-
.../tika/parser/microsoft/ExcelExtractor.java | 2 +-
.../tika/parser/microsoft/HSLFExtractor.java | 73 ++--
.../tika/parser/microsoft/JackcessExtractor.java | 2 +-
.../apache/tika/parser/microsoft/OfficeParser.java | 28 +-
.../tika/parser/microsoft/OutlookExtractor.java | 44 +-
.../tika/parser/microsoft/WordExtractor.java | 2 +-
.../microsoft/onenote/OneNoteTreeWalker.java | 6 +-
.../microsoft/ooxml/AbstractOOXMLExtractor.java | 2 +-
.../parser/microsoft/pst/OutlookPSTParser.java | 2 +-
.../tika/parser/microsoft/xml/WordMLParser.java | 8 +-
.../parser/microsoft/PowerPointParserTest.java | 8 +-
.../tika-parser-miscoffice-module/pom.xml | 2 +-
.../apache/tika/parser/odf/OpenDocumentParser.java | 2 +-
.../tika/parser/indesign/IDMLParserTest.java | 4 +
.../org/apache/tika/parser/odf/ODFParserTest.java | 2 +-
.../tika-parser-news-module/pom.xml | 2 +-
.../tika-parser-ocr-module/pom.xml | 2 +-
.../tika-parser-pdf-module/pom.xml | 9 +-
.../apache/tika/parser/pdf/AbstractPDF2XHTML.java | 240 ++++++++---
.../java/org/apache/tika/parser/pdf/OCR2XHTML.java | 8 +-
.../java/org/apache/tika/parser/pdf/PDF2XHTML.java | 49 ++-
.../tika/parser/pdf/PDFMarkedContent2XHTML.java | 3 +-
.../java/org/apache/tika/parser/pdf/PDFParser.java | 169 +++++++-
.../apache/tika/parser/pdf/PDFParserConfig.java | 260 +++++++-----
.../tika/parser/pdf/PDMetadataExtractor.java | 4 +-
.../pdf/{ => image}/ImageGraphicsEngine.java | 92 +++--
.../pdf/image/ImageGraphicsEngineFactory.java | 44 ++
.../tika/renderer/pdf/mutool/MuPDFRenderer.java | 149 +++++++
.../pdf/pdfbox}/NoTextPDFRenderer.java | 2 +-
.../renderer/pdf/pdfbox/PDDocumentRenderer.java | 19 +-
.../tika/renderer/pdf/pdfbox/PDFBoxRenderer.java | 211 ++++++++++
.../renderer/pdf/pdfbox/PDFRenderingState.java | 33 +-
.../renderer/pdf/pdfbox/TextOnlyPDFRenderer.java | 106 +++++
.../pdf/pdfbox/VectorGraphicsOnlyPDFRenderer.java | 133 ++++++
.../pdf/MyCustomImageGraphicsEngineFactory.java | 44 ++
.../org/apache/tika/parser/pdf/PDFParserTest.java | 82 ++--
.../apache/tika/parser/pdf/PDFRenderingTest.java | 132 ++++++
.../pdf/tika-config-custom-graphics-engine.xml | 28 ++
.../tika/parser/pdf/tika-rendering-config.xml | 34 ++
.../parser/pdf/tika-rendering-per-page-config.xml | 32 ++
.../resources/test-documents/testPDF_rotated.pdf | Bin 0 -> 38309 bytes
.../test-documents/testStandardsExtractor.pdf | Bin 143659 -> 0 bytes
.../tika-parser-pkg-module/pom.xml | 2 +-
.../java/org/apache/tika/parser/pkg/RarParser.java | 21 +-
.../tika-parser-text-module/pom.xml | 2 +-
.../pom.xml | 33 +-
.../org/apache/tika/parser/http/HttpParser.java | 103 +++++
.../org/apache/tika/parser/wacz/WACZParser.java | 162 ++++++++
.../org/apache/tika/parser/warc/WARCParser.java | 148 +++++++
.../services/org.apache.tika.parser.Parser | 5 +-
.../apache/tika/parser/http/HttpParserTest.java | 29 +-
.../apache/tika/parser/wacz/WACZParserTest.java | 28 +-
.../apache/tika/parser/warc/WARCParserTest.java} | 30 +-
.../src/test/resources/test-documents/cc.warc.gz | Bin 0 -> 5392 bytes
.../resources/test-documents/gzip_extra_sl.warc.gz | Bin 0 -> 459 bytes
.../test/resources/test-documents/http-response | 18 +
.../test/resources/test-documents/testWACZ.wacz | Bin
.../tika-parser-xml-module/pom.xml | 2 +-
.../tika-parser-xmp-commons/pom.xml | 2 +-
.../tika-parser-zip-commons/pom.xml | 2 +-
.../tika-parsers-standard-package/pom.xml | 7 +-
.../tika/detect/TestContainerAwareDetector.java | 4 +
.../java/org/apache/tika/mime/TestMimeTypes.java | 14 +
.../tika/parser/AutoDetectParserConfigTest.java | 67 +++
.../apache/tika/parser/crypto/TSDParserTest.java | 8 +-
.../parser/fork/ForkParserIntegrationTest.java | 2 +
.../tika/parser/microsoft/XML2003ParserTest.java | 4 +-
.../tika/parser/microsoft/rtf/RTFParserTest.java | 14 +
.../tika/parser/ocr/TesseractOCRParserTest.java | 5 +
.../org/apache/tika/parser/pdf/PDFParserTest.java | 27 ++
.../sax/StandardsExtractingContentHandlerTest.java | 5 +-
.../UpcasingContentHandlerDecoratorFactory.java | 25 +-
.../apache/tika/utils/ServiceLoaderUtilsTest.java | 4 +-
.../resources/configs/tika-config-no-names.xml | 33 ++
...ka-config-upcasing-custom-handler-decorator.xml | 29 ++
.../resources/configs/tika-config-with-names.xml | 33 ++
.../configs/tika-rendering-mupdf-config.xml | 25 ++
.../test-documents/testStandardsExtractor.txt | 13 +
tika-pipes/pom.xml | 85 +++-
tika-pipes/tika-emitters/pom.xml | 3 +-
.../pom.xml | 26 +-
.../tika/pipes/emitter/azblob/AZBlobEmitter.java | 255 ++++++++++++
.../pipes/emitter/azblob/TestAZBlobEmitter.java | 52 +++
.../test/resources/config/tika-config-az-blob.xml | 30 ++
tika-pipes/tika-emitters/tika-emitter-fs/pom.xml | 2 +-
tika-pipes/tika-emitters/tika-emitter-gcs/pom.xml | 2 +-
.../tika-emitters/tika-emitter-opensearch/pom.xml | 4 +-
tika-pipes/tika-emitters/tika-emitter-s3/pom.xml | 2 +-
tika-pipes/tika-emitters/tika-emitter-solr/pom.xml | 2 +-
tika-pipes/tika-fetchers/pom.xml | 3 +-
.../pom.xml | 41 +-
.../tika/pipes/fetcher/azblob/AZBlobFetcher.java | 195 +++++++++
.../pipes/fetcher/azblob/TestAZBlobFetcher.java} | 44 +-
.../src/test/resources/tika-config-az-blob.xml | 32 ++
tika-pipes/tika-fetchers/tika-fetcher-gcs/pom.xml | 2 +-
.../tika/pipes/fetcher/s3/TestGCSFetcher.java | 11 +-
tika-pipes/tika-fetchers/tika-fetcher-http/pom.xml | 2 +-
tika-pipes/tika-fetchers/tika-fetcher-s3/pom.xml | 2 +-
tika-pipes/tika-httpclient-commons/pom.xml | 2 +-
.../org/apache/tika/client/HttpClientFactory.java | 15 +-
tika-pipes/tika-pipes-iterators/pom.xml | 3 +-
.../pom.xml | 26 +-
.../pipesiterator/azblob/AZBlobPipesIterator.java | 155 +++++++
.../azblob/TestAZBlobPipesIterator.java | 99 +++++
.../src/test}/resources/log4j2.xml | 0
.../tika-pipes-iterator-csv/pom.xml | 2 +-
.../tika-pipes-iterator-gcs/pom.xml | 4 +-
.../tika-pipes-iterator-jdbc/pom.xml | 2 +-
.../pipesiterator/jdbc/TestJDBCPipesIterator.java | 6 +-
.../tika-pipes-iterator-s3/pom.xml | 2 +-
.../src/test}/resources/log4j2.xml | 0
.../tika-pipes-iterator-solr/pom.xml | 2 +-
tika-serialization/pom.xml | 4 +-
tika-server/pom.xml | 2 +-
tika-server/tika-server-client/pom.xml | 2 +-
tika-server/tika-server-core/pom.xml | 2 +-
.../server/core/DefaultInputStreamFactory.java | 7 +
.../tika/server/core/FetcherStreamFactory.java | 30 +-
.../tika/server/core/InputStreamFactory.java | 15 +
.../org/apache/tika/server/core/TikaServerCli.java | 67 ++-
.../apache/tika/server/core/TikaServerConfig.java | 56 ++-
.../apache/tika/server/core/TikaServerProcess.java | 56 ++-
.../tika/server/core/TikaServerWatchDog.java | 28 +-
.../org/apache/tika/server/core/TlsConfig.java | 171 ++++++++
.../server/core/resource/DetectorResource.java | 5 +-
.../server/core/resource/MetadataResource.java | 5 +-
.../core/resource/RecursiveMetadataResource.java | 2 +-
.../tika/server/core/resource/TikaResource.java | 15 +-
.../server/core/resource/UnpackerResource.java | 6 +-
.../org/apache/tika/server/core/CXFTestBase.java | 35 +-
.../tika/server/core/IntegrationTestBase.java | 23 +-
.../org/apache/tika/server/core/TikaPipesTest.java | 3 +-
.../tika/server/core/TikaResourceFetcherTest.java | 110 +++++
.../core/TikaServerAsyncIntegrationTest.java | 9 +-
.../tika/server/core/TikaServerConfigTest.java | 48 +++
.../server/core/TikaServerIntegrationTest.java | 213 ++++++++++
.../core/TikaServerPipesIntegrationTest.java | 27 +-
.../tika-config-server-fetcher-template.xml | 38 ++
.../tika-config-server-tls-one-way-template.xml | 43 ++
.../tika-config-server-tls-two-way-template.xml | 46 +++
.../resources/configs/tika-config-server-tls.xml | 45 ++
.../src/test/resources/ssl-keys/README.txt | 28 ++
.../resources/ssl-keys/tika-client-keystore.p12 | Bin 0 -> 2505 bytes
.../resources/ssl-keys/tika-client-truststore.p12 | Bin 0 -> 3429 bytes
.../src/test/resources/ssl-keys/tika-client.crt | Bin 0 -> 789 bytes
.../resources/ssl-keys/tika-server-keystore.p12 | Bin 0 -> 2505 bytes
.../resources/ssl-keys/tika-server-truststore.p12 | Bin 0 -> 3429 bytes
.../src/test/resources/ssl-keys/tika-server.crt | Bin 0 -> 789 bytes
tika-server/tika-server-eval/pom.xml | 9 +-
tika-server/tika-server-standard/pom.xml | 24 +-
.../standard/resource/XMPMetadataResource.java | 3 +-
.../apache/tika/server/standard/FetcherTest.java | 12 +-
...herTest.java => OpenNLPMetadataFilterTest.java} | 74 ++--
...rTest.java => OptimaizeMetadataFilterTest.java} | 73 ++--
.../apache/tika/server/standard/TikaPipesTest.java | 28 +-
.../tika/server/standard/TikaResourceTest.java | 5 +
.../tika-config-langdetect-opennlp-filter.xml | 32 ++
.../tika-config-langdetect-optimaize-filter.xml | 32 ++
tika-translate/pom.xml | 70 ++--
.../translate/impl/CachedTranslatorTest.java | 39 +-
.../translate/impl/GoogleTranslatorTest.java | 24 +-
.../impl/JoshuaNetworkTranslatorTest.java | 37 +-
.../translate/impl/Lingo24TranslatorTest.java | 27 +-
.../translate/impl/MarianTranslatorTest.java | 33 +-
.../translate/impl/MicrosoftTranslatorTest.java | 23 +-
.../translate/impl/MosesTranslatorTest.java | 16 +-
.../language/translate/impl/RTGTranslatorTest.java | 64 ++-
.../translate/impl/YandexTranslatorTest.java | 52 +--
tika-xmp/pom.xml | 9 +-
.../java/org/apache/tika/xmp/TikaToXMPTest.java | 27 +-
.../java/org/apache/tika/xmp/XMPMetadataTest.java | 61 +--
359 files changed, 8223 insertions(+), 2127 deletions(-)
rename tika-pipes/tika-pipes-iterators/tika-pipes-iterator-s3/src/test/resources/log4j.properties => .github/workflows/branch_1x-jdk11-build.yml (60%)
copy .github/workflows/{main-jdk11-build.yml => branch_1x-jdk8-build.yml} (89%)
copy tika-batch/src/test/java/org/apache/tika/batch/fs/strawman/StrawmanTest.java => tika-core/src/main/java/org/apache/tika/extractor/EmbeddedDocumentExtractorFactory.java (72%)
copy tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/DefaultInputStreamFactory.java => tika-core/src/main/java/org/apache/tika/extractor/ParsingEmbeddedDocumentExtractorFactory.java (54%)
copy tika-integration-tests/tika-pipes-solr-integration-tests/src/test/java/org/apache/tika/pipes/solr/tests/TikaPipesSolr8Test.java => tika-core/src/main/java/org/apache/tika/metadata/Rendering.java (73%)
copy tika-core/src/main/java/org/apache/tika/metadata/{PagedText.java => TikaPagedText.java} (61%)
copy tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/DefaultInputStreamFactory.java => tika-core/src/main/java/org/apache/tika/metadata/WARC.java (61%)
create mode 100644 tika-core/src/main/java/org/apache/tika/metadata/writefilter/MetadataWriteFilter.java
copy tika-batch/src/test/java/org/apache/tika/batch/fs/strawman/StrawmanTest.java => tika-core/src/main/java/org/apache/tika/metadata/writefilter/MetadataWriteFilterFactory.java (81%)
create mode 100644 tika-core/src/main/java/org/apache/tika/metadata/writefilter/StandardWriteFilter.java
create mode 100644 tika-core/src/main/java/org/apache/tika/metadata/writefilter/StandardWriteFilterFactory.java
copy tika-batch/src/test/java/org/apache/tika/batch/fs/strawman/StrawmanTest.java => tika-core/src/main/java/org/apache/tika/parser/RenderingParser.java (81%)
create mode 100644 tika-core/src/main/java/org/apache/tika/renderer/CompositeRenderer.java
create mode 100644 tika-core/src/main/java/org/apache/tika/renderer/PageBasedRenderResults.java
create mode 100644 tika-core/src/main/java/org/apache/tika/renderer/PageRangeRequest.java
copy tika-example/src/test/java/org/apache/tika/example/AdvancedTypeDetectorTest.java => tika-core/src/main/java/org/apache/tika/renderer/RenderRequest.java (64%)
mode change 100755 => 100644
create mode 100644 tika-core/src/main/java/org/apache/tika/renderer/RenderResult.java
copy tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/DefaultInputStreamFactory.java => tika-core/src/main/java/org/apache/tika/renderer/RenderResults.java (57%)
create mode 100644 tika-core/src/main/java/org/apache/tika/renderer/Renderer.java
copy tika-batch/src/test/java/org/apache/tika/batch/fs/strawman/StrawmanTest.java => tika-core/src/main/java/org/apache/tika/renderer/RenderingState.java (75%)
copy tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/DefaultInputStreamFactory.java => tika-core/src/main/java/org/apache/tika/renderer/RenderingTracker.java (64%)
copy tika-batch/src/test/java/org/apache/tika/batch/fs/strawman/StrawmanTest.java => tika-core/src/main/java/org/apache/tika/sax/ContentHandlerDecoratorFactory.java (73%)
create mode 100644 tika-core/src/test/java/org/apache/tika/metadata/writefilter/StandardWriteFilterTest.java
create mode 100644 tika-core/src/test/resources/org/apache/tika/config/TIKA-3695-fields.xml
create mode 100644 tika-core/src/test/resources/org/apache/tika/config/TIKA-3695.xml
copy tika-integration-tests/tika-pipes-solr-integration-tests/src/test/java/org/apache/tika/pipes/solr/tests/{TikaPipesSolr8Test.java => TikaPipesSolr9Test.java} (91%)
copy tika-integration-tests/tika-pipes-solr-integration-tests/src/test/java/org/apache/tika/pipes/solr/tests/{TikaPipesSolr8Test.java => TikaPipesSolr9ZkTest.java} (63%)
copy {tika-pipes/tika-httpclient-commons => tika-integration-tests/tika-resource-loading-tests}/pom.xml (61%)
copy tika-batch/src/test/java/org/apache/tika/batch/CommandLineParserBuilderTest.java => tika-integration-tests/tika-resource-loading-tests/src/test/java/org/apache/custom/parser/CustomParserTest.java (52%)
create mode 100644 tika-integration-tests/tika-resource-loading-tests/src/test/java/org/apache/custom/parser/MyCustomParser.java
copy {tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/main => tika-integration-tests/tika-resource-loading-tests/src/test}/resources/META-INF/services/org.apache.tika.parser.Parser (91%)
create mode 100644 tika-langdetect/tika-langdetect-opennlp/src/main/java/org/apache/tika/langdetect/opennlp/metadatafilter/OpenNLPMetadataFilter.java
create mode 100644 tika-langdetect/tika-langdetect-optimaize/src/main/java/org/apache/tika/langdetect/optimaize/metadatafilter/OptimaizeMetadataFilter.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/main/java/org/apache/tika/parser/dgn/DGN8Parser.java
copy tika-parsers/tika-parsers-standard/{tika-parsers-standard-package/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java => tika-parsers-standard-modules/tika-parser-cad-module/src/test/java/org/apache/tika/parser/dgn/DGN8ParserTest.java} (53%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/test/resources/test-documents/testDGN7.dgn
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/test/resources/test-documents/testDGN8.dgn
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/test/resources/test-documents/testDWG-AC1027.dwg
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-cad-module/src/test/resources/test-documents/testDWG-AC1032.dwg
rename tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/{ => image}/ImageGraphicsEngine.java (85%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/image/ImageGraphicsEngineFactory.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/mutool/MuPDFRenderer.java
rename tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/{parser/pdf => renderer/pdf/pdfbox}/NoTextPDFRenderer.java (98%)
copy tika-integration-tests/tika-pipes-solr-integration-tests/src/test/java/org/apache/tika/pipes/solr/tests/TikaPipesSolr8Test.java => tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/pdfbox/PDDocumentRenderer.java (71%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/pdfbox/PDFBoxRenderer.java
copy tika-example/src/test/java/org/apache/tika/example/LanguageDetectorExampleTest.java => tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/pdfbox/PDFRenderingState.java (55%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/pdfbox/TextOnlyPDFRenderer.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/renderer/pdf/pdfbox/VectorGraphicsOnlyPDFRenderer.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/MyCustomImageGraphicsEngineFactory.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/java/org/apache/tika/parser/pdf/PDFRenderingTest.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/resources/org/apache/tika/parser/pdf/tika-config-custom-graphics-engine.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/resources/org/apache/tika/parser/pdf/tika-rendering-config.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/resources/org/apache/tika/parser/pdf/tika-rendering-per-page-config.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/resources/test-documents/testPDF_rotated.pdf
delete mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/test/resources/test-documents/testStandardsExtractor.pdf
copy tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/{tika-parser-html-module => tika-parser-webarchive-module}/pom.xml (76%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/main/java/org/apache/tika/parser/http/HttpParser.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/main/java/org/apache/tika/parser/wacz/WACZParser.java
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/main/java/org/apache/tika/parser/warc/WARCParser.java
copy tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/{tika-parser-cad-module => tika-parser-webarchive-module}/src/main/resources/META-INF/services/org.apache.tika.parser.Parser (87%)
copy tika-batch/src/test/java/org/apache/tika/batch/CommandLineParserBuilderTest.java => tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/java/org/apache/tika/parser/http/HttpParserTest.java (53%)
copy tika-batch/src/test/java/org/apache/tika/batch/CommandLineParserBuilderTest.java => tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/java/org/apache/tika/parser/wacz/WACZParserTest.java (53%)
copy tika-parsers/tika-parsers-standard/{tika-parsers-standard-package/src/test/java/org/apache/tika/parser/crypto/TSDParserTest.java => tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/java/org/apache/tika/parser/warc/WARCParserTest.java} (52%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/resources/test-documents/cc.warc.gz
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/resources/test-documents/gzip_extra_sl.warc.gz
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-webarchive-module/src/test/resources/test-documents/http-response
copy tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/{tika-parser-zip-commons => tika-parser-webarchive-module}/src/test/resources/test-documents/testWACZ.wacz (100%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/java/org/apache/tika/parser/AutoDetectParserConfigTest.java
copy tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/DefaultInputStreamFactory.java => tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/java/org/apache/tika/sax/UpcasingContentHandlerDecoratorFactory.java (56%)
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/resources/configs/tika-config-no-names.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/resources/configs/tika-config-upcasing-custom-handler-decorator.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/resources/configs/tika-config-with-names.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/resources/configs/tika-rendering-mupdf-config.xml
create mode 100644 tika-parsers/tika-parsers-standard/tika-parsers-standard-package/src/test/resources/test-documents/testStandardsExtractor.txt
copy tika-pipes/tika-emitters/{tika-emitter-s3 => tika-emitter-az-blob}/pom.xml (86%)
create mode 100644 tika-pipes/tika-emitters/tika-emitter-az-blob/src/main/java/org/apache/tika/pipes/emitter/azblob/AZBlobEmitter.java
create mode 100644 tika-pipes/tika-emitters/tika-emitter-az-blob/src/test/java/org/apache/tika/pipes/emitter/azblob/TestAZBlobEmitter.java
create mode 100644 tika-pipes/tika-emitters/tika-emitter-az-blob/src/test/resources/config/tika-config-az-blob.xml
copy tika-pipes/tika-fetchers/{tika-fetcher-s3 => tika-fetcher-az-blob}/pom.xml (78%)
create mode 100644 tika-pipes/tika-fetchers/tika-fetcher-az-blob/src/main/java/org/apache/tika/pipes/fetcher/azblob/AZBlobFetcher.java
copy tika-pipes/tika-fetchers/{tika-fetcher-gcs/src/test/java/org/apache/tika/pipes/fetcher/s3/TestGCSFetcher.java => tika-fetcher-az-blob/src/test/java/org/apache/tika/pipes/fetcher/azblob/TestAZBlobFetcher.java} (55%)
create mode 100644 tika-pipes/tika-fetchers/tika-fetcher-az-blob/src/test/resources/tika-config-az-blob.xml
copy tika-pipes/tika-pipes-iterators/{tika-pipes-iterator-solr => tika-pipes-iterator-az-blob}/pom.xml (85%)
create mode 100644 tika-pipes/tika-pipes-iterators/tika-pipes-iterator-az-blob/src/main/java/org/apache/tika/pipes/pipesiterator/azblob/AZBlobPipesIterator.java
create mode 100644 tika-pipes/tika-pipes-iterators/tika-pipes-iterator-az-blob/src/test/java/org/apache/tika/pipes/pipesiterator/azblob/TestAZBlobPipesIterator.java
copy {tika-app/src/main => tika-pipes/tika-pipes-iterators/tika-pipes-iterator-az-blob/src/test}/resources/log4j2.xml (100%)
copy {tika-app/src/main => tika-pipes/tika-pipes-iterators/tika-pipes-iterator-s3/src/test}/resources/log4j2.xml (100%)
create mode 100644 tika-server/tika-server-core/src/main/java/org/apache/tika/server/core/TlsConfig.java
create mode 100644 tika-server/tika-server-core/src/test/java/org/apache/tika/server/core/TikaResourceFetcherTest.java
create mode 100644 tika-server/tika-server-core/src/test/resources/configs/tika-config-server-fetcher-template.xml
create mode 100644 tika-server/tika-server-core/src/test/resources/configs/tika-config-server-tls-one-way-template.xml
create mode 100644 tika-server/tika-server-core/src/test/resources/configs/tika-config-server-tls-two-way-template.xml
create mode 100644 tika-server/tika-server-core/src/test/resources/configs/tika-config-server-tls.xml
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/README.txt
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-client-keystore.p12
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-client-truststore.p12
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-client.crt
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-server-keystore.p12
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-server-truststore.p12
create mode 100644 tika-server/tika-server-core/src/test/resources/ssl-keys/tika-server.crt
copy tika-server/tika-server-standard/src/test/java/org/apache/tika/server/standard/{FetcherTest.java => OpenNLPMetadataFilterTest.java} (54%)
copy tika-server/tika-server-standard/src/test/java/org/apache/tika/server/standard/{FetcherTest.java => OptimaizeMetadataFilterTest.java} (56%)
create mode 100644 tika-server/tika-server-standard/src/test/resources/config/tika-config-langdetect-opennlp-filter.xml
create mode 100644 tika-server/tika-server-standard/src/test/resources/config/tika-config-langdetect-optimaize-filter.xml