diff --git a/docs/source/tutorials/add_new_doc_type.rst b/docs/source/tutorials/add_new_doc_type.rst index f8d0b148..0496f14d 100644 --- a/docs/source/tutorials/add_new_doc_type.rst +++ b/docs/source/tutorials/add_new_doc_type.rst @@ -103,6 +103,11 @@ General scheme of adding AttachmentExtractor def __init__(self) -> None: self.attachment_extractor = PdfAttachmentsExtractor() + def read(self, path: str, document_type: Optional[str] = None, parameters: Optional[dict] = None) -> UnstructuredDocument: + # some code + attachments = self.attachment_extractor.get_attachments(tmpdir, filename, parameters) + # some code + Example of adding pdf/djvu handlers -----------------------------------