about | summary | refs | log | tree | commit | diff
path: root/src/server/chunker/pdf_chunker.py
diff options
context:
space:
mode:
Diffstat (limited to 'src/server/chunker/pdf_chunker.py')
-rw-r--r-- src/server/chunker/pdf_chunker.py | 2
1 files changed, 1 insertions, 1 deletions
diff --git a/src/server/chunker/pdf_chunker.py b/src/server/chunker/pdf_chunker.py
index 697550f2e..9d4cfb1b2 100644
--- a/src/server/chunker/pdf_chunker.py
+++ b/src/server/chunker/pdf_chunker.py
@@ -153,7 +153,7 @@ class ElementExtractor:
xref = img_info[0] # XREF of the image in the PDF
base_image = page.parent.extract_image(xref) # Extract the image by its XREF
image_bytes = base_image["image"]
- image = Image.open(io.BytesIO(image_bytes)) # Convert bytes to PIL image
+ image = Image.open(io.BytesIO(image_bytes)).convert("RGB") # Ensure it's RGB before saving as PNG
width_ratio = img.width / page.rect.width # Scale factor for width
height_ratio = img.height / page.rect.height # Scale factor for height