This is an automated email from the ASF dual-hosted git repository.
tallison pushed a change to branch TIKA-4712
in repository https://gitbox.apache.org/repos/asf/tika.git
from 88f8ac6c38 TIKA-4712 -- initial steps for unit tests
add c5b9849d9f [TIKA-4327] set TZ because of metadata-extractor change in update (#2753)
add 0a0b7e718d TIKA-4717 -- update/publish initial 4.0.0-SNAPSHOT docs (#2756)
add 4cf115c0e2 TIKA-4716 (#2755)
add 9e1efa4d73 Update pipes docs (#2759)
add 3c64ae76e8 Merge branch 'main' into TIKA-4712
No new revisions were added by this update.
Summary of changes:
.github/workflows/main-jdk17-build.yml | 2 +
CHANGES.txt | 3 +
docs/build-docs.sh | 53 ++
.../advanced/flores-eval-20260320.txt | 0
.../ROOT/examples/external-parser-exiftool.json | 1 +
.../ROOT/examples/external-parser-ffmpeg.json | 1 +
.../ROOT/examples/external-parser-multi.json | 1 +
.../modules/ROOT/examples/external-parser-sox.json | 1 +
docs/modules/ROOT/examples/pipes-fs-emitter.json | 1 +
docs/modules/ROOT/examples/pipes-fs-fetcher.json | 1 +
docs/modules/ROOT/examples/pipes-fs-pipeline.json | 1 +
docs/modules/ROOT/nav.adoc | 7 +
.../pages/advanced/generative-language-model.adoc | 4 +-
.../advanced/integration-testing/tika-server.adoc | 4 +-
.../pages/advanced/language-detection-build.adoc | 2 +-
.../ROOT/pages/advanced/language-detection.adoc | 5 +-
.../configuration/parsers/external-parser.adoc | 176 +++++++
docs/modules/ROOT/pages/developers/index.adoc | 2 +-
docs/modules/ROOT/pages/index.adoc | 4 +
docs/modules/ROOT/pages/maintainers/site.adoc | 52 +-
.../pages/migration-to-4x/migrating-to-4x.adoc | 72 ++-
docs/modules/ROOT/pages/pipes/configuration.adoc | 152 ++++++
docs/modules/ROOT/pages/pipes/emitters.adoc | 220 ++++++++
docs/modules/ROOT/pages/pipes/fetchers.adoc | 245 +++++++++
docs/modules/ROOT/pages/pipes/getting-started.adoc | 135 +++++
docs/modules/ROOT/pages/pipes/index.adoc | 40 +-
docs/modules/ROOT/pages/pipes/iterators.adoc | 212 ++++++++
docs/modules/ROOT/pages/pipes/reporters.adoc | 93 ++++
docs/modules/ROOT/pages/pipes/unpack-config.adoc | 2 +-
docs/modules/ROOT/pages/security.adoc | 18 +-
.../ROOT/pages/using-tika/java-api/index.adoc | 51 +-
docs/supplemental-ui/partials/toolbar.hbs | 3 +
.../services/org.apache.tika.parser.Parser | 16 -
.../apache/tika/detect/FileCommandDetector.java | 3 +-
.../org/apache/tika/embedder/ExternalEmbedder.java | 13 +-
.../parser/external/CompositeExternalParser.java | 44 --
.../tika/parser/external/ExternalParser.java | 581 +++++++--------------
.../ExternalParserConfig.java | 69 ++-
.../external/ExternalParsersConfigReader.java | 223 --------
.../ExternalParsersConfigReaderMetKeys.java | 43 --
.../parser/external/ExternalParsersFactory.java | 67 ---
.../apache/tika/parser/external/package-info.java | 22 -
.../tika/parser/external2/ExternalParser.java | 227 --------
.../java/org/apache/tika/utils/ProcessUtils.java | 74 +++
.../java/org/apache/tika/utils/StreamGobbler.java | 52 +-
.../tika/parser/external/tika-external-parsers.xml | 117 -----
.../tika/detect/siegfried/SiegfriedDetector.java | 3 +-
tika-parent/pom.xml | 2 +-
.../org/apache/tika/parser/gdal/GDALParser.java | 5 +-
.../apache/tika/parser/gdal/TestGDALParser.java | 6 +-
.../parser/scientific/integration/TestParsers.java | 11 -
.../apache/tika/parser/AutoDetectParserTest.java | 8 -
.../org/apache/tika/parser/pdf/PDFParserTest.java | 4 +-
.../apache/tika/parser/pkg/UnrarParserTest.java | 4 +-
.../apache/tika/parser/dwg/DWGParserConfig.java | 4 +-
.../org/apache/tika/parser/dwg/DWGParserTest.java | 4 +-
.../apache/tika/parser/image/JpegParserTest.java | 20 +
.../apache/tika/parser/ocr/TesseractOCRParser.java | 6 +-
.../renderer/pdf/poppler/PopplerRendererTest.java | 4 +-
.../apache/tika/parser/pkg/UnrarParserTest.java | 4 +-
.../apache/tika/parser/strings/StringsParser.java | 6 +-
.../tika/parser/strings/StringsParserTest.java | 4 +-
.../tika/parser/external/ExternalParserTest.java | 195 +++++++
.../tika/parser/external2/ExternalParserTest.java | 100 ----
.../configs/TIKA-3557-exiftool-example.json | 6 +-
.../src/test/resources/configs/TIKA-3557.json | 2 +-
...-example.json => external-parser-exiftool.json} | 15 +-
.../resources/configs/external-parser-ffmpeg.json | 35 ++
.../resources/configs/external-parser-multi.json | 47 ++
.../resources/configs/external-parser-sox.json | 37 ++
.../services/org.apache.tika.parser.Parser | 16 -
.../tika/server/standard/TikaParsersTest.java | 4 +-
72 files changed, 2289 insertions(+), 1378 deletions(-)
create mode 100755 docs/build-docs.sh
rename docs/modules/ROOT/{pages => attachments}/advanced/flores-eval-20260320.txt (100%)
create mode 120000 docs/modules/ROOT/examples/external-parser-exiftool.json
create mode 120000 docs/modules/ROOT/examples/external-parser-ffmpeg.json
create mode 120000 docs/modules/ROOT/examples/external-parser-multi.json
create mode 120000 docs/modules/ROOT/examples/external-parser-sox.json
create mode 120000 docs/modules/ROOT/examples/pipes-fs-emitter.json
create mode 120000 docs/modules/ROOT/examples/pipes-fs-fetcher.json
create mode 120000 docs/modules/ROOT/examples/pipes-fs-pipeline.json
create mode 100644
docs/modules/ROOT/pages/configuration/parsers/external-parser.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/configuration.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/emitters.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/fetchers.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/getting-started.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/iterators.adoc
create mode 100644 docs/modules/ROOT/pages/pipes/reporters.adoc
create mode 100644 docs/supplemental-ui/partials/toolbar.hbs
delete mode 100644
tika-app/src/main/resources/META-INF/services/org.apache.tika.parser.Parser
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external/CompositeExternalParser.java
rename tika-core/src/main/java/org/apache/tika/parser/{external2 => external}/ExternalParserConfig.java (59%)
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external/ExternalParsersConfigReader.java
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external/ExternalParsersConfigReaderMetKeys.java
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external/ExternalParsersFactory.java
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external/package-info.java
delete mode 100644
tika-core/src/main/java/org/apache/tika/parser/external2/ExternalParser.java
delete mode 100644
tika-core/src/main/resources/org/apache/tika/parser/external/tika-external-parsers.xml
create mode 100644
tika-serialization/src/test/java/org/apache/tika/parser/external/ExternalParserTest.java
delete mode 100644
tika-serialization/src/test/java/org/apache/tika/parser/external2/ExternalParserTest.java
copy tika-serialization/src/test/resources/configs/{TIKA-3557-exiftool-example.json => external-parser-exiftool.json} (54%)
create mode 100644
tika-serialization/src/test/resources/configs/external-parser-ffmpeg.json
create mode 100644
tika-serialization/src/test/resources/configs/external-parser-multi.json
create mode 100644
tika-serialization/src/test/resources/configs/external-parser-sox.json
delete mode 100644
tika-server/tika-server-standard/src/main/resources/META-INF/services/org.apache.tika.parser.Parser