kotaemon/knowledgehub/indices/extractors/doc_parsers.py
2023-11-27 14:25:54 +07:00

20 lines
452 B
Python

from ..base import DocTransformer, LlamaIndexMixin
class BaseDocParser(DocTransformer):
    """Common base class for the document parsers defined in this module.

    Adds no behaviour on top of ``DocTransformer``; it only gives the
    extractor wrappers below a shared parent type.
    """
class TitleExtractor(LlamaIndexMixin, BaseDocParser):
    """Document parser backed by ``llama_index.extractors.TitleExtractor``."""

    def _get_li_class(self):
        """Return the llama_index ``TitleExtractor`` class.

        The import happens inside the method, so ``llama_index`` is only
        loaded when this method is actually called.
        """
        # Aliased so the imported class is not confused with this wrapper,
        # which carries the same name.
        from llama_index.extractors import TitleExtractor as li_title_extractor

        return li_title_extractor
class SummaryExtractor(LlamaIndexMixin, BaseDocParser):
    """Document parser backed by ``llama_index.extractors.SummaryExtractor``."""

    def _get_li_class(self):
        """Return the llama_index ``SummaryExtractor`` class.

        The import happens inside the method, so ``llama_index`` is only
        loaded when this method is actually called.
        """
        # Aliased so the imported class is not confused with this wrapper,
        # which carries the same name.
        from llama_index.extractors import SummaryExtractor as li_summary_extractor

        return li_summary_extractor