aleph.ingest.text

PDFIngestor

class aleph.ingest.text.PDFIngestor

Imports

  • aleph.ingest.text.TextIngestor

Methods

match(cls, meta, local_path)
ingest(self, meta, local_path)

TextIngestor

class aleph.ingest.text.TextIngestor

Imports

  • <UNKNOWN>

Methods

create_document(self, meta)
create_page(self, document, text)
extract_pdf(self, meta, pdf_path)
store_pdf(self, meta, pdf_path)