fix: pass header to Tika if PDF_EXTRACT_IMAGES is true

This commit is contained in:
ayan4m1 2025-04-20 17:36:40 +02:00
parent 852d9dcbe9
commit 039dec6820

View File

@@ -99,6 +99,9 @@ class TikaLoader:
else:
headers = {}
if self.kwargs.get("PDF_EXTRACT_IMAGES") == True:
headers['X-Tika-PDFextractInlineImages'] = 'true'
endpoint = self.url
if not endpoint.endswith("/"):
endpoint += "/"