mirror of
https://github.com/crewAIInc/crewAI.git
synced 2026-05-01 23:32:39 +00:00
Squashed 'packages/tools/' content from commit 78317b9c
git-subtree-dir: packages/tools git-subtree-split: 78317b9c127f18bd040c1d77e3c0840cdc9a5b38
This commit is contained in:
587
crewai_tools/aws/bedrock/browser/browser_toolkit.py
Normal file
587
crewai_tools/aws/bedrock/browser/browser_toolkit.py
Normal file
@@ -0,0 +1,587 @@
|
||||
"""Toolkit for navigating web with AWS browser."""
|
||||
|
||||
import json
|
||||
import logging
|
||||
import asyncio
|
||||
from typing import Dict, List, Tuple, Any, Type
|
||||
from urllib.parse import urlparse
|
||||
|
||||
from crewai.tools import BaseTool
|
||||
from pydantic import BaseModel, Field
|
||||
|
||||
from .browser_session_manager import BrowserSessionManager
|
||||
from .utils import aget_current_page, get_current_page
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
# Input schemas
|
||||
class NavigateToolInput(BaseModel):
    """Arguments accepted by ``NavigateTool``."""

    # Destination address; the tool validates the http(s) scheme itself.
    url: str = Field(description="URL to navigate to")
    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class ClickToolInput(BaseModel):
    """Arguments accepted by ``ClickTool``."""

    # CSS selector identifying the element to be clicked.
    selector: str = Field(description="CSS selector for the element to click on")
    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class GetElementsToolInput(BaseModel):
    """Arguments accepted by ``GetElementsTool``."""

    # CSS selector whose matches will be listed.
    selector: str = Field(description="CSS selector for elements to get")
    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class ExtractTextToolInput(BaseModel):
    """Arguments accepted by ``ExtractTextTool``."""

    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class ExtractHyperlinksToolInput(BaseModel):
    """Arguments accepted by ``ExtractHyperlinksTool``."""

    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class NavigateBackToolInput(BaseModel):
    """Arguments accepted by ``NavigateBackTool``."""

    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
class CurrentWebPageToolInput(BaseModel):
    """Arguments accepted by ``CurrentWebPageTool``."""

    # Selects which per-thread browser session services the request.
    thread_id: str = Field(
        default="default",
        description="Thread ID for the browser session",
    )
|
||||
|
||||
|
||||
# Base tool class
|
||||
class BrowserBaseTool(BaseTool):
    """Base class for browser tools backed by a shared session manager.

    Subclasses implement ``_run`` (sync) and ``_arun`` (async); this base
    provides per-thread page lookup and, when constructed inside a running
    event loop, patches ``_run`` to drive ``_arun`` via ``nest_asyncio``.
    """

    def __init__(self, session_manager: BrowserSessionManager):
        """Initialize with a session manager.

        Args:
            session_manager: Shared manager that owns per-thread browsers.
        """
        super().__init__()
        self._session_manager = session_manager

        # Inside a running loop a blocking sync `_run` would deadlock, so
        # reroute it through the async implementation.
        if self._is_in_asyncio_loop() and hasattr(self, '_arun'):
            self._original_run = self._run

            # Override _run to use _arun when in an asyncio loop
            def patched_run(*args, **kwargs):
                try:
                    import nest_asyncio

                    # Fetch the loop once and reuse it (the original code
                    # called asyncio.get_event_loop() a second time for
                    # run_until_complete).
                    loop = asyncio.get_event_loop()
                    nest_asyncio.apply(loop)
                    return loop.run_until_complete(
                        self._arun(*args, **kwargs)
                    )
                except Exception as e:
                    return f"Error in patched _run: {str(e)}"

            self._run = patched_run

    async def get_async_page(self, thread_id: str) -> Any:
        """Get or create an async page for the specified thread."""
        browser = await self._session_manager.get_async_browser(thread_id)
        return await aget_current_page(browser)

    def get_sync_page(self, thread_id: str) -> Any:
        """Get or create a sync page for the specified thread."""
        browser = self._session_manager.get_sync_browser(thread_id)
        return get_current_page(browser)

    def _is_in_asyncio_loop(self) -> bool:
        """Return True when called from inside a running event loop.

        Uses asyncio.get_running_loop(), which raises RuntimeError when no
        loop is running -- replacing the deprecated get_event_loop() +
        is_running() probe with equivalent behavior.
        """
        try:
            asyncio.get_running_loop()
        except RuntimeError:
            return False
        return True
|
||||
|
||||
|
||||
# Tool classes
|
||||
class NavigateTool(BrowserBaseTool):
    """Send the thread's browser to a caller-supplied URL."""

    name: str = "navigate_browser"
    description: str = "Navigate a browser to the specified URL"
    args_schema: Type[BaseModel] = NavigateToolInput

    def _run(self, url: str, thread_id: str = "default", **kwargs) -> str:
        """Synchronously open *url* in the session for *thread_id*."""
        try:
            target = self.get_sync_page(thread_id)

            # Refuse anything that is not plain http(s); the ValueError is
            # converted into an error string by the handler below.
            if urlparse(url).scheme not in ("http", "https"):
                raise ValueError("URL scheme must be 'http' or 'https'")

            result = target.goto(url)
            code = result.status if result else "unknown"
            return f"Navigating to {url} returned status code {code}"
        except Exception as e:
            return f"Error navigating to {url}: {str(e)}"

    async def _arun(self, url: str, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously open *url* in the session for *thread_id*."""
        try:
            target = await self.get_async_page(thread_id)

            # Same scheme guard as the sync path.
            if urlparse(url).scheme not in ("http", "https"):
                raise ValueError("URL scheme must be 'http' or 'https'")

            result = await target.goto(url)
            code = result.status if result else "unknown"
            return f"Navigating to {url} returned status code {code}"
        except Exception as e:
            return f"Error navigating to {url}: {str(e)}"
|
||||
|
||||
|
||||
class ClickTool(BrowserBaseTool):
    """Click the element matched by a CSS selector."""

    name: str = "click_element"
    description: str = "Click on an element with the given CSS selector"
    args_schema: Type[BaseModel] = ClickToolInput

    # Restrict matches to elements Playwright reports as visible.
    visible_only: bool = True
    # Forward Playwright's strict mode (error when selector matches many).
    playwright_strict: bool = False
    # How long (ms) Playwright waits for the element to become actionable.
    playwright_timeout: float = 1_000

    def _selector_effective(self, selector: str) -> str:
        """Append a visibility filter unless visible_only is disabled."""
        return f"{selector} >> visible=1" if self.visible_only else selector

    def _run(self, selector: str, thread_id: str = "default", **kwargs) -> str:
        """Synchronously click the first match for *selector*."""
        try:
            page = self.get_sync_page(thread_id)
            effective = self._selector_effective(selector=selector)
            from playwright.sync_api import TimeoutError as PlaywrightTimeoutError

            try:
                page.click(
                    effective,
                    strict=self.playwright_strict,
                    timeout=self.playwright_timeout,
                )
            except PlaywrightTimeoutError:
                return f"Unable to click on element '{selector}'"
            except Exception as click_error:
                return f"Unable to click on element '{selector}': {str(click_error)}"

            return f"Clicked element '{selector}'"
        except Exception as e:
            return f"Error clicking on element: {str(e)}"

    async def _arun(self, selector: str, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously click the first match for *selector*."""
        try:
            page = await self.get_async_page(thread_id)
            effective = self._selector_effective(selector=selector)
            from playwright.async_api import TimeoutError as PlaywrightTimeoutError

            try:
                await page.click(
                    effective,
                    strict=self.playwright_strict,
                    timeout=self.playwright_timeout,
                )
            except PlaywrightTimeoutError:
                return f"Unable to click on element '{selector}'"
            except Exception as click_error:
                return f"Unable to click on element '{selector}': {str(click_error)}"

            return f"Clicked element '{selector}'"
        except Exception as e:
            return f"Error clicking on element: {str(e)}"
|
||||
|
||||
|
||||
class NavigateBackTool(BrowserBaseTool):
    """Step the browser one entry back in its history."""

    name: str = "navigate_back"
    description: str = "Navigate back to the previous page"
    args_schema: Type[BaseModel] = NavigateBackToolInput

    def _run(self, thread_id: str = "default", **kwargs) -> str:
        """Synchronously navigate back in the thread's session."""
        try:
            page = self.get_sync_page(thread_id)
            # Inner handler distinguishes navigation failures from
            # session-lookup failures handled by the outer except.
            try:
                page.go_back()
            except Exception as nav_error:
                return f"Unable to navigate back: {str(nav_error)}"
            return "Navigated back to the previous page"
        except Exception as e:
            return f"Error navigating back: {str(e)}"

    async def _arun(self, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously navigate back in the thread's session."""
        try:
            page = await self.get_async_page(thread_id)
            try:
                await page.go_back()
            except Exception as nav_error:
                return f"Unable to navigate back: {str(nav_error)}"
            return "Navigated back to the previous page"
        except Exception as e:
            return f"Error navigating back: {str(e)}"
|
||||
|
||||
|
||||
class ExtractTextTool(BrowserBaseTool):
    """Flatten the current page to plain newline-separated text."""

    name: str = "extract_text"
    description: str = "Extract all the text on the current webpage"
    args_schema: Type[BaseModel] = ExtractTextToolInput

    @staticmethod
    def _text_from_html(html: str) -> str:
        """Strip markup from *html* and return its visible text."""
        from bs4 import BeautifulSoup

        return BeautifulSoup(html, "html.parser").get_text(separator="\n").strip()

    def _run(self, thread_id: str = "default", **kwargs) -> str:
        """Synchronously extract the page text for *thread_id*."""
        try:
            # Check the optional dependency up front so the user gets an
            # actionable message rather than a raw ImportError.
            try:
                from bs4 import BeautifulSoup  # noqa: F401
            except ImportError:
                return (
                    "The 'beautifulsoup4' package is required to use this tool."
                    " Please install it with 'pip install beautifulsoup4'."
                )

            page = self.get_sync_page(thread_id)
            return self._text_from_html(page.content())
        except Exception as e:
            return f"Error extracting text: {str(e)}"

    async def _arun(self, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously extract the page text for *thread_id*."""
        try:
            try:
                from bs4 import BeautifulSoup  # noqa: F401
            except ImportError:
                return (
                    "The 'beautifulsoup4' package is required to use this tool."
                    " Please install it with 'pip install beautifulsoup4'."
                )

            page = await self.get_async_page(thread_id)
            return self._text_from_html(await page.content())
        except Exception as e:
            return f"Error extracting text: {str(e)}"
|
||||
|
||||
|
||||
class ExtractHyperlinksTool(BrowserBaseTool):
    """Tool for extracting hyperlinks from a webpage."""

    name: str = "extract_hyperlinks"
    description: str = "Extract all hyperlinks on the current webpage"
    args_schema: Type[BaseModel] = ExtractHyperlinksToolInput

    @staticmethod
    def _links_from_html(content: str) -> str:
        """Parse *content* and return absolute links as pretty-printed JSON.

        Shared by the sync and async paths, which previously duplicated
        this logic verbatim.
        """
        from bs4 import BeautifulSoup

        soup = BeautifulSoup(content, "html.parser")
        links = []
        for link in soup.find_all("a", href=True):
            href = link["href"]
            # Keep absolute links only. The original also tested
            # startswith("https"), which was dead code: any string starting
            # with "https" already starts with "http".
            if href.startswith("http"):
                links.append({"text": link.get_text().strip(), "url": href})

        if not links:
            return "No hyperlinks found on the current page."
        return json.dumps(links, indent=2)

    def _run(self, thread_id: str = "default", **kwargs) -> str:
        """Synchronously extract hyperlinks for *thread_id*."""
        try:
            # Check the optional dependency up front for a clear message.
            try:
                from bs4 import BeautifulSoup  # noqa: F401
            except ImportError:
                return (
                    "The 'beautifulsoup4' package is required to use this tool."
                    " Please install it with 'pip install beautifulsoup4'."
                )

            page = self.get_sync_page(thread_id)
            return self._links_from_html(page.content())
        except Exception as e:
            return f"Error extracting hyperlinks: {str(e)}"

    async def _arun(self, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously extract hyperlinks for *thread_id*."""
        try:
            try:
                from bs4 import BeautifulSoup  # noqa: F401
            except ImportError:
                return (
                    "The 'beautifulsoup4' package is required to use this tool."
                    " Please install it with 'pip install beautifulsoup4'."
                )

            page = await self.get_async_page(thread_id)
            return self._links_from_html(await page.content())
        except Exception as e:
            return f"Error extracting hyperlinks: {str(e)}"
|
||||
|
||||
|
||||
class GetElementsTool(BrowserBaseTool):
    """List the text content of every element matching a selector."""

    name: str = "get_elements"
    description: str = "Get elements from the webpage using a CSS selector"
    args_schema: Type[BaseModel] = GetElementsToolInput

    def _run(self, selector: str, thread_id: str = "default", **kwargs) -> str:
        """Synchronously list matches for *selector*."""
        try:
            page = self.get_sync_page(thread_id)
            matches = page.query_selector_all(selector)
            if not matches:
                return f"No elements found with selector '{selector}'"

            # One numbered line per match, numbering from 1.
            lines = [
                f"Element {idx}: {el.text_content().strip()}"
                for idx, el in enumerate(matches, start=1)
            ]
            return "\n".join(lines)
        except Exception as e:
            return f"Error getting elements: {str(e)}"

    async def _arun(self, selector: str, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously list matches for *selector*."""
        try:
            page = await self.get_async_page(thread_id)
            matches = await page.query_selector_all(selector)
            if not matches:
                return f"No elements found with selector '{selector}'"

            lines = []
            for idx, el in enumerate(matches, start=1):
                body = await el.text_content()
                lines.append(f"Element {idx}: {body.strip()}")
            return "\n".join(lines)
        except Exception as e:
            return f"Error getting elements: {str(e)}"
|
||||
|
||||
|
||||
class CurrentWebPageTool(BrowserBaseTool):
    """Report the URL and title of the thread's current page."""

    name: str = "current_webpage"
    description: str = "Get information about the current webpage"
    args_schema: Type[BaseModel] = CurrentWebPageToolInput

    def _run(self, thread_id: str = "default", **kwargs) -> str:
        """Synchronously report the current page's URL and title."""
        try:
            page = self.get_sync_page(thread_id)
            return f"URL: {page.url}\nTitle: {page.title()}"
        except Exception as e:
            return f"Error getting current webpage info: {str(e)}"

    async def _arun(self, thread_id: str = "default", **kwargs) -> str:
        """Asynchronously report the current page's URL and title."""
        try:
            page = await self.get_async_page(thread_id)
            heading = await page.title()
            return f"URL: {page.url}\nTitle: {heading}"
        except Exception as e:
            return f"Error getting current webpage info: {str(e)}"
|
||||
|
||||
|
||||
class BrowserToolkit:
    """Toolkit for navigating web with AWS Bedrock browser.

    This toolkit provides a set of tools for working with a remote browser
    and supports multiple threads by maintaining separate browser sessions
    for each thread ID. Browsers are created lazily only when needed.

    Example:
        ```python
        from crewai import Agent, Task, Crew
        from crewai_tools.aws.bedrock.browser import create_browser_toolkit

        # Create the browser toolkit
        toolkit, browser_tools = create_browser_toolkit(region="us-west-2")

        # Create a CrewAI agent that uses the browser tools
        research_agent = Agent(
            role="Web Researcher",
            goal="Research and summarize web content",
            backstory="You're an expert at finding information online.",
            tools=browser_tools
        )

        # Create a task for the agent
        research_task = Task(
            description="Navigate to https://example.com and extract all text content. Summarize the main points.",
            agent=research_agent
        )

        # Create and run the crew
        crew = Crew(
            agents=[research_agent],
            tasks=[research_task]
        )
        result = crew.kickoff()

        # Clean up browser resources when done
        import asyncio
        asyncio.run(toolkit.cleanup())
        ```
    """

    def __init__(self, region: str = "us-west-2"):
        """
        Initialize the toolkit

        Args:
            region: AWS region for the browser client
        """
        self.region = region
        self.session_manager = BrowserSessionManager(region=region)
        self.tools: List[BaseTool] = []
        # Reference to an in-flight cleanup task scheduled by sync_cleanup
        # (kept so the task is not garbage-collected before it finishes).
        self._cleanup_task = None
        self._nest_current_loop()
        self._setup_tools()

    def _nest_current_loop(self):
        """Apply nest_asyncio if we're inside a running asyncio loop."""
        # get_running_loop() raises RuntimeError when no loop is running,
        # replacing the deprecated get_event_loop() + is_running() probe.
        try:
            loop = asyncio.get_running_loop()
        except RuntimeError:
            return  # no running loop: nothing to patch
        try:
            import nest_asyncio

            nest_asyncio.apply(loop)
        except Exception as e:
            logger.warning(f"Failed to apply nest_asyncio: {str(e)}")

    def _setup_tools(self) -> None:
        """Initialize tools without creating any browsers."""
        self.tools = [
            NavigateTool(session_manager=self.session_manager),
            ClickTool(session_manager=self.session_manager),
            NavigateBackTool(session_manager=self.session_manager),
            ExtractTextTool(session_manager=self.session_manager),
            ExtractHyperlinksTool(session_manager=self.session_manager),
            GetElementsTool(session_manager=self.session_manager),
            CurrentWebPageTool(session_manager=self.session_manager)
        ]

    def get_tools(self) -> List[BaseTool]:
        """
        Get the list of browser tools

        Returns:
            List of CrewAI tools
        """
        return self.tools

    def get_tools_by_name(self) -> Dict[str, BaseTool]:
        """
        Get a dictionary of tools mapped by their names

        Returns:
            Dictionary of {tool_name: tool}
        """
        return {tool.name: tool for tool in self.tools}

    async def cleanup(self) -> None:
        """Clean up all browser sessions asynchronously"""
        await self.session_manager.close_all_browsers()
        logger.info("All browser sessions cleaned up")

    def sync_cleanup(self) -> None:
        """Clean up all browser sessions from synchronous code"""
        # NOTE: asyncio is already imported at module level; the original
        # re-imported it locally for no reason.
        try:
            loop = asyncio.get_event_loop()
            if loop.is_running():
                # Keep a reference: the event loop holds tasks only weakly,
                # so a bare create_task() result could be garbage-collected
                # before the cleanup coroutine completes.
                self._cleanup_task = asyncio.create_task(self.cleanup())
            else:
                loop.run_until_complete(self.cleanup())
        except RuntimeError:
            asyncio.run(self.cleanup())
|
||||
|
||||
|
||||
def create_browser_toolkit(
    region: str = "us-west-2",
) -> Tuple[BrowserToolkit, List[BaseTool]]:
    """
    Create a BrowserToolkit

    Args:
        region: AWS region for browser client

    Returns:
        Tuple of (toolkit, tools)
    """
    kit = BrowserToolkit(region=region)
    return kit, kit.get_tools()
|
||||
Reference in New Issue
Block a user