mirror of
https://github.com/crewAIInc/crewAI.git
synced 2026-01-11 09:08:31 +00:00
0b3f00e6 chore: update project version to 0.73.0 and revise uv.lock dependencies (#455) ad19b074 feat: replace embedchain with native crewai adapter (#451) git-subtree-dir: packages/tools git-subtree-split: 0b3f00e67c0dae24d188c292dc99759fd1c841f7
51 lines
1.5 KiB
Python
51 lines
1.5 KiB
Python
from typing import Optional, Type
|
|
|
|
from pydantic import BaseModel, Field
|
|
|
|
from ..rag.rag_tool import RagTool
|
|
from crewai_tools.rag.data_types import DataType
|
|
|
|
|
|
class FixedPDFSearchToolSchema(BaseModel):
    """Input for PDFSearchTool."""

    # Only the search text is accepted here: PDFSearchTool swaps to this
    # schema when it is constructed with a specific PDF, so no `pdf`
    # argument is needed per call.
    query: str = Field(
        default=...,  # Ellipsis marks the field as required
        description="Mandatory query you want to use to search the PDF's content",
    )
|
|
|
|
|
|
class PDFSearchToolSchema(FixedPDFSearchToolSchema):
    """Input for PDFSearchTool."""

    # Adds the document to search on top of the inherited `query` field;
    # this is the default args schema of PDFSearchTool.
    pdf: str = Field(
        default=...,  # Ellipsis marks the field as required
        description="File path or URL of a PDF file to be searched",
    )
|
|
|
|
|
|
class PDFSearchTool(RagTool):
    # Tool built on RagTool for searching the content of PDF files.
    # A PDF may be supplied once at construction time (the tool then only
    # needs a query per call) or passed on each call to `_run`.
    # NOTE: documented with comments rather than a class docstring so the
    # pydantic model's generated schema description is left unchanged.

    name: str = "Search a PDF's content"
    description: str = (
        "A tool that can be used to semantic search a query from a PDF's content."
    )
    args_schema: Type[BaseModel] = PDFSearchToolSchema

    def __init__(self, pdf: Optional[str] = None, **kwargs):
        """Build the tool, optionally binding it to a single PDF.

        Args:
            pdf: File path or URL of a PDF to register immediately. When
                omitted, the class-level description and args schema are
                left as declared.
            **kwargs: Forwarded unchanged to the parent initializer.
        """
        super().__init__(**kwargs)
        if pdf is None:
            return

        # A PDF was given up front: register it, then narrow the description
        # and the input schema so callers only have to provide a query.
        self.add(pdf)
        self.description = f"A tool that can be used to semantic search a query the {pdf} PDF's content."
        self.args_schema = FixedPDFSearchToolSchema
        self._generate_description()

    def add(self, pdf: str) -> None:
        """Register ``pdf`` with the parent tool, tagged as ``DataType.PDF_FILE``."""
        super().add(pdf, data_type=DataType.PDF_FILE)

    def _run(
        self,
        query: str,
        pdf: Optional[str] = None,
        similarity_threshold: float | None = None,
        limit: int | None = None,
    ) -> str:
        """Search for ``query``, first registering ``pdf`` when one is given.

        Args:
            query: Text to search for.
            pdf: Optional file path or URL of a PDF to add before searching.
            similarity_threshold: Passed through unchanged to the parent
                ``_run``.
            limit: Passed through unchanged to the parent ``_run``.

        Returns:
            Whatever the parent ``_run`` returns for the query.
        """
        if pdf is not None:
            # Per-call PDFs are added to the tool before the query is run.
            self.add(pdf)

        search_result = super()._run(
            query=query,
            similarity_threshold=similarity_threshold,
            limit=limit,
        )
        return search_result
|