presenton/servers/fastapi/image_processor/image_from_pptx.py
2025-05-13 02:35:30 +05:45

34 lines
906 B
Python

import io
import os
import subprocess
from typing import List
from image_processor.utils import get_page_images_from_pdf
def get_pdf_from_pptx(pptx_path: str, temp_dir: str) -> str:
    """Convert a PPTX file to PDF with LibreOffice and return the PDF path.

    The launcher command is read from the ``LIBREOFFICE`` environment
    variable and invoked as
    ``<launcher> --convert-to pdf <pptx_path> --outdir <temp_dir>``.
    The command runs without a shell, so quotes, spaces or shell
    metacharacters in ``pptx_path`` / ``temp_dir`` are passed through
    literally instead of being interpreted as shell syntax.

    Args:
        pptx_path: Path of the presentation to convert.
        temp_dir: Directory handed to LibreOffice as ``--outdir``.

    Returns:
        ``temp_dir`` joined with the presentation's base name plus ``.pdf``,
        i.e. the location where the converted file is expected. The
        converter's exit status is not checked and the file's existence is
        not verified here; stdout/stderr are printed for diagnosis.

    Raises:
        RuntimeError: If ``LIBREOFFICE`` is unset or blank.
        ValueError: If ``LIBREOFFICE`` contains unbalanced quotes.
        OSError: If the configured executable cannot be started.
    """
    import shlex  # local import: only this function needs it

    base_name = os.path.splitext(os.path.basename(pptx_path))[0]
    print(base_name)

    # The variable may hold a launcher with its own arguments, so split it
    # the way a shell would rather than treating it as a single path.
    posix = os.name != "nt"
    launcher = shlex.split(os.getenv("LIBREOFFICE") or "", posix=posix)
    if not posix:
        # Non-POSIX splitting leaves the surrounding quotes on each token.
        launcher = [token.strip('"') for token in launcher]
    if not launcher:
        raise RuntimeError(
            "The LIBREOFFICE environment variable must name the LibreOffice "
            "executable used for PPTX to PDF conversion."
        )

    # Argument list + no shell: paths are never re-parsed as shell syntax.
    result = subprocess.run(
        [*launcher, "--convert-to", "pdf", pptx_path, "--outdir", temp_dir],
        capture_output=True,
        text=True,
    )
    print("LibreOffice stdout:", result.stdout)
    print("LibreOffice stderr:", result.stderr)

    pdf_path = os.path.join(temp_dir, f"{base_name}.pdf")
    print(pdf_path)
    return pdf_path
def get_images_from_pptx(pptx_path: str) -> List[str]:
    """Turn a presentation into per-page images via an intermediate PDF.

    The directory containing ``pptx_path`` is used as the working
    directory: it is passed to ``get_pdf_from_pptx`` as the output
    directory and then to ``get_page_images_from_pdf`` together with the
    resulting PDF path.

    Args:
        pptx_path: Path of the presentation to render.

    Returns:
        Whatever ``get_page_images_from_pdf`` returns for the converted PDF
        (presumably one image path per page -- confirm against that helper).
    """
    # Intermediate PDF and downstream output share the source's directory.
    work_dir = os.path.dirname(pptx_path)
    return get_page_images_from_pdf(
        get_pdf_from_pptx(pptx_path, work_dir),
        work_dir,
    )