This is an automated email from the ASF dual-hosted git repository.
tallison pushed a commit to branch branch_3x
in repository https://gitbox.apache.org/repos/asf/tika.git
The following commit(s) were added to refs/heads/branch_3x by this push:
new c20f28529 TIKA-4465 -- fix inputstream type
c20f28529 is described below
commit c20f28529a00b37a5cc5151265a0f92310858be4
Author: tallison <[email protected]>
AuthorDate: Mon Aug 18 16:19:36 2025 -0400
TIKA-4465 -- fix inputstream type
---
.../src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)
diff --git a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
index 132efa3f9..11726a716 100644
--- a/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
+++ b/tika-parsers/tika-parsers-standard/tika-parsers-standard-modules/tika-parser-pdf-module/src/main/java/org/apache/tika/parser/pdf/AbstractPDF2XHTML.java
@@ -556,7 +556,7 @@ class AbstractPDF2XHTML extends PDFTextStripper {
try (TemporaryResources tmp = new TemporaryResources()) {
try (RenderResult renderResult = renderCurrentPage(pdPage,
context, tmp)) {
Metadata renderMetadata = renderResult.getMetadata();
- try (TikaInputStream tis = renderResult.getInputStream()) {
+ try (TikaInputStream tis =
TikaInputStream.get(renderResult.getInputStream())) {
renderMetadata.set(TikaCoreProperties.CONTENT_TYPE_PARSER_OVERRIDE,
ocrImageMediaType.toString());
ocrParser.parse(tis, new EmbeddedContentHandler(new
BodyContentHandler(xhtml)),