feat: integrate with docling (#471) bump:patch
* feat: add docling reader implementation * feat: expose docling to UI * fix: improve docling output parsing * docs: update README --------- Co-authored-by: Tadashi <tadashi@cinnamon.is>
This commit is contained in:
@@ -39,6 +39,7 @@ from kotaemon.indices.ingests.files import (
|
||||
KH_DEFAULT_FILE_EXTRACTORS,
|
||||
adobe_reader,
|
||||
azure_reader,
|
||||
docling_reader,
|
||||
unstructured,
|
||||
web_reader,
|
||||
)
|
||||
@@ -673,6 +674,8 @@ class IndexDocumentPipeline(BaseFileIndexIndexing):
|
||||
readers[".pdf"] = adobe_reader
|
||||
elif self.reader_mode == "azure-di":
|
||||
readers[".pdf"] = azure_reader
|
||||
elif self.reader_mode == "docling":
|
||||
readers[".pdf"] = docling_reader
|
||||
|
||||
dev_readers, _, _ = dev_settings()
|
||||
readers.update(dev_readers)
|
||||
@@ -692,6 +695,7 @@ class IndexDocumentPipeline(BaseFileIndexIndexing):
|
||||
"Azure AI Document Intelligence (figure+table extraction)",
|
||||
"azure-di",
|
||||
),
|
||||
("Docling", "docling"),
|
||||
],
|
||||
"component": "dropdown",
|
||||
},
|
||||
|
Reference in New Issue
Block a user