langchain_community.document_loaders.parsers.language.c source code
from typing import TYPE_CHECKING
from langchain_community.document_loaders.parsers.language.tree_sitter_segmenter import ( # noqa: E501
TreeSitterSegmenter,
)
if TYPE_CHECKING:
from tree_sitter import Language
# Query text returned by CSegmenter.get_chunk_query(). It is a bracketed
# list of four patterns, each tagged with a capture name:
#   @struct   - struct_specifier that has a field_declaration_list body
#   @enum     - enum_specifier that has an enumerator_list body
#   @union    - union_specifier that has a field_declaration_list body
#   @function - function_definition
CHUNK_QUERY = "\n".join(
    (
        "[",
        "(struct_specifier",
        "body: (field_declaration_list)) @struct",
        "(enum_specifier",
        "body: (enumerator_list)) @enum",
        "(union_specifier",
        "body: (field_declaration_list)) @union",
        "(function_definition) @function",
        "]",
    )
)
[docs]
class CSegmenter(TreeSitterSegmenter):
    """Segmenter for C source code, built on ``TreeSitterSegmenter``.

    Provides the two C-specific pieces defined below: the language object
    and the chunk query string.
    """

    def get_language(self) -> "Language":
        """Return the ``Language`` object that ``tree_sitter_languages`` gives for ``"c"``.

        ``tree_sitter_languages`` is imported inside the method, so the
        package is only needed when this method is actually called.
        """
        from tree_sitter_languages import get_language as load_language

        c_language = load_language("c")
        return c_language

    def get_chunk_query(self) -> str:
        """Return the module-level ``CHUNK_QUERY`` string."""
        query: str = CHUNK_QUERY
        return query