from typing import List, Optional

from crewai_tools.rag.chunkers.base_chunker import BaseChunker


class WebsiteChunker(BaseChunker):
    """BaseChunker subclass that supplies its own default separator list.

    The class only customises construction: it picks default values for the
    chunking parameters and forwards everything to ``BaseChunker.__init__``.
    How the base class applies these values is not visible from this file.
    NOTE(review): the name suggests this is meant for text scraped from web
    pages -- confirm against the callers.
    """

    def __init__(
        self,
        chunk_size: int = 2500,
        chunk_overlap: int = 250,
        separators: Optional[List[str]] = None,
        keep_separator: bool = True,
    ):
        """Initialise the chunker, filling in default separators if needed.

        Args:
            chunk_size: Forwarded unchanged to the base class (default 2500).
                NOTE(review): presumably a size in characters -- confirm in
                BaseChunker.
            chunk_overlap: Forwarded unchanged to the base class (default 250).
            separators: Separator strings to hand to the base class. When
                ``None``, a built-in list ordered from the coarsest break
                (triple newline) down to the empty string is used instead.
                An explicitly passed list, including an empty one, is
                forwarded as-is.
            keep_separator: Forwarded unchanged to the base class.
        """
        # Only ``None`` triggers the defaults; the list is created inside the
        # call, so each instance that falls back gets its own list object.
        effective_separators = (
            separators
            if separators is not None
            else [
                "\n\n\n",  # Major section breaks
                "\n\n",  # Paragraph breaks
                "\n",  # Line breaks
                ". ",  # Sentence endings
                "! ",  # Exclamation endings
                "? ",  # Question endings
                "; ",  # Semicolon breaks
                ", ",  # Comma breaks
                " ",  # Word breaks
                "",  # Character level
            ]
        )
        # Positional forwarding is kept because the base class's parameter
        # names are not visible from this file.
        super().__init__(
            chunk_size,
            chunk_overlap,
            effective_separators,
            keep_separator,
        )