Source code for dedoc.converters.concrete_converters.pdf_converter

import os
from typing import Optional

from dedoc.converters.concrete_converters.abstract_converter import AbstractConverter
from dedoc.extensions import converted_extensions, converted_mimes


class PDFConverter(AbstractConverter):
    """
    Converter that turns pdf-like documents (e.g. DjVu files) into PDF by calling the ddjvu application.

    See the :class:`~dedoc.converters.AbstractConverter` documentation for the description of the methods' parameters.
    """

    def __init__(self, *, config: dict) -> None:
        super().__init__(config=config)
        # NOTE(review): presumably a limit (in seconds) consumed by the base class
        # when it runs the external command -- confirm in AbstractConverter.
        self.timeout = 60

    def can_convert(self, extension: str, mime: str, parameters: Optional[dict] = None) -> bool:
        """
        Tell whether the document is pdf-like, judging by its extension (compared case-insensitively, e.g. .djvu) or by its mime type.
        """
        # The extension is checked first; the mime type is consulted only when the extension does not match.
        if extension.lower() in converted_extensions.pdf_like_format:
            return True
        return mime in converted_mimes.pdf_like_format

    def do_convert(self, tmp_dir: str, filename: str, extension: str) -> str:
        """
        Run ddjvu on the pdf-like document located in ``tmp_dir`` and return the name (not the full path) of the resulting .pdf file.
        """
        pdf_name = f"{filename}.pdf"
        source_path = os.path.join(tmp_dir, f"{filename}{extension}")
        target_path = os.path.join(tmp_dir, pdf_name)

        # Arguments are passed as a list: ddjvu --format=pdf <input> <output>
        ddjvu_command = ["ddjvu", "--format=pdf", source_path, target_path]
        self._run_subprocess(command=ddjvu_command, filename=filename, expected_path=target_path)

        return pdf_name