Separate rerankers, splitters and extractors (#85)
This commit is contained in:
committed by
GitHub
parent
0dede9c82d
commit
2186c5558f
7
knowledgehub/indices/extractors/__init__.py
Normal file
7
knowledgehub/indices/extractors/__init__.py
Normal file
@@ -0,0 +1,7 @@
|
||||
from .doc_parsers import BaseDocParser, SummaryExtractor, TitleExtractor
|
||||
|
||||
# Public names re-exported from .doc_parsers by this package.
__all__ = ["BaseDocParser", "TitleExtractor", "SummaryExtractor"]
|
19
knowledgehub/indices/extractors/doc_parsers.py
Normal file
19
knowledgehub/indices/extractors/doc_parsers.py
Normal file
@@ -0,0 +1,19 @@
|
||||
from ..base import DocTransformer, LlamaIndexMixin
|
||||
|
||||
|
||||
class BaseDocParser(DocTransformer):
    """Common base class for the document parsers/extractors in this module.

    Adds no behaviour of its own on top of ``DocTransformer``.
    """
|
||||
|
||||
|
||||
class TitleExtractor(LlamaIndexMixin, BaseDocParser):
    """Document parser backed by ``llama_index.extractors.TitleExtractor``."""

    def _get_li_class(self):
        """Return the llama_index ``TitleExtractor`` class.

        The import happens inside the method, so ``llama_index`` is only
        loaded when this method is called.
        """
        # Aliased so the imported class is not confused with this wrapper,
        # which shares its name.
        # NOTE(review): presumably consumed by LlamaIndexMixin - confirm in ..base
        from llama_index.extractors import TitleExtractor as LITitleExtractor

        return LITitleExtractor
|
||||
|
||||
|
||||
class SummaryExtractor(LlamaIndexMixin, BaseDocParser):
    """Document parser backed by ``llama_index.extractors.SummaryExtractor``."""

    def _get_li_class(self):
        """Return the llama_index ``SummaryExtractor`` class.

        The import happens inside the method, so ``llama_index`` is only
        loaded when this method is called.
        """
        # Aliased so the imported class is not confused with this wrapper,
        # which shares its name.
        # NOTE(review): presumably consumed by LlamaIndexMixin - confirm in ..base
        from llama_index.extractors import SummaryExtractor as LISummaryExtractor

        return LISummaryExtractor
|
Reference in New Issue
Block a user