Enforce all IO objects to be subclassed from Document (#88)

* enforce Document as IO

* Separate rerankers, splitters and extractors (#85)

* partially refactor importing

* add text to embedding outputs

---------

Co-authored-by: Nguyen Trung Duc (john) <trungduc1992@gmail.com>
This commit is contained in:
ian_Cin
2023-11-27 16:35:09 +07:00
committed by GitHub
parent 2186c5558f
commit 8e0779a22d
13 changed files with 108 additions and 59 deletions

View File

@@ -1,7 +1,7 @@
from __future__ import annotations
from abc import abstractmethod
from typing import Any, Sequence, Type
from typing import Any, Type
from llama_index.node_parser.interface import NodeParser
@@ -20,9 +20,9 @@ class DocTransformer(BaseComponent):
@abstractmethod
def run(
self,
documents: Sequence[Document],
documents: list[Document],
**kwargs,
) -> Sequence[Document]:
) -> list[Document]:
...
@@ -62,9 +62,9 @@ class LlamaIndexMixin:
def run(
self,
documents: Sequence[Document],
documents: list[Document],
**kwargs,
) -> Sequence[Document]:
) -> list[Document]:
"""Run Llama-index node parser and convert the output to Document from
kotaemon
"""