aleph.ingest.document

DocumentIngestor

class aleph.ingest.document.DocumentIngestor

Imports

  • <UNKNOWN>

extract_pdf_alternative(self, meta, pdf_path)

generate_pdf_alternative(self, meta, local_path)

Convert LibreOffice-supported documents to PDF.

ingest(self, meta, local_path)

PlainTextIngestor

class aleph.ingest.document.PlainTextIngestor

Imports

  • aleph.ingest.document.DocumentIngestor

match(cls, meta, local_path)

PresentationIngestor

class aleph.ingest.document.PresentationIngestor

Imports

  • aleph.ingest.document.DocumentIngestor