feat(agent): add Web Search Agent using SerpAPI (#104)

* feat(agent): add Web Search Agent using SerpAPI

  Signed-off-by: royalpinto007 <royalpinto007@gmail.com>

* feat(reasoning): enhance agent orchestration and fallback behavior

  Signed-off-by: royalpinto007 <royalpinto007@gmail.com>

---------

Signed-off-by: royalpinto007 <royalpinto007@gmail.com>
video-db · Dec 24, 2024 · 9266f1d · 9266f1d
1 parent 604df70
commit 9266f1d
Show file tree

Hide file tree

Showing 5 changed files with 311 additions and 6 deletions.
diff --git a/backend/.env.sample b/backend/.env.sample
@@ -43,3 +43,5 @@ FAL_KEY=
 COMPOSIO_API_KEY=
 COMPOSIO_APPS=["HACKERNEWS"]
 
+# Web Search Agent
+SERP_API_KEY=
diff --git a/backend/director/agents/web_search_agent.py b/backend/director/agents/web_search_agent.py
@@ -0,0 +1,217 @@
+import logging
+import os
+import requests
+from dotenv import load_dotenv
+
+from director.agents.base import BaseAgent, AgentResponse, AgentStatus
+from director.core.session import (
+    Session,
+    VideosContent,
+    VideoData,
+    MsgStatus,
+)
+from director.tools.serp import SerpAPI
+from urllib.parse import urlparse, parse_qs
+
+load_dotenv()
+logger = logging.getLogger(__name__)
+
+SEARCH_AGENT_PARAMETERS = {
+    "type": "object",
+    "properties": {
+        "engine": {
+            "type": "string",
+            "description": "Engine to use for the search. Currently supports 'serp'.",
+            "enum": ["serp"],
+            "default": "serp",
+        },
+        "job_type": {
+            "type": "string",
+            "enum": ["search_videos"],
+            "description": "The type of search to perform. Possible value: search_videos.",
+        },
+        "search_videos": {
+            "type": "object",
+            "properties": {
+                "query": {
+                    "type": "string",
+                    "description": "Search query for the output.",
+                    "minLength": 1,
+                },
+                "count": {
+                    "type": "integer",
+                    "description": "Number of results to retrieve.",
+                    "default": 5,
+                    "minimum": 1,
+                    "maximum": 50,
+                },
+                "duration": {
+                    "type": "string",
+                    "description": "Filter videos by duration (short, medium, long).",
+                    "enum": ["short", "medium", "long"],
+                },
+                "serp_config": {
+                    "type": "object",
+                    "description": "Config to use when SerpAPI engine is used",
+                    "properties": {
+                        "base_url": {
+                            "type": "string",
+                            "description": "Base URL for the SerpAPI service"
+                        },
+                        "timeout": {
+                            "type": "integer",
+                            "description": "Timeout in seconds for API requests",
+                            "default": 10
+                        }
+                    }
+                },
+            },
+            "required": ["query"],
+        },
+    },
+    "required": ["job_type", "engine"],
+}
+
+SUPPORTED_ENGINES = ["serp"]
+
+class WebSearchAgent(BaseAgent):
+    def __init__(self, session: Session, **kwargs):
+        self.agent_name = "web_search"
+        self.description = (
+            "Performs web searches to find and retrieve relevant videos using various engines."
+        )
+        self.parameters = SEARCH_AGENT_PARAMETERS
+        super().__init__(session=session, **kwargs)
+
+    def run(
+        self,
+        engine: str,
+        job_type: str,
+        search_videos: dict | None = None,
+        *args,
+        **kwargs,
+    ) -> AgentResponse:
+        """
+        Perform a search using the specified engine and handle different job types.
+
+        :param engine: Search engine to use (e.g., 'serp').
+        :param job_type: Type of job to execute (e.g., 'search_videos').
+        :param search_videos: Parameters specific to the 'search_videos' job type.
+        :return: A structured response containing search results.
+        """
+        if engine not in SUPPORTED_ENGINES:
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message=f"Engine '{engine}' is not supported.",
+            )
+
+        self.api_key = os.getenv("SERP_API_KEY")
+        if not self.api_key:
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message="SERP_API_KEY environment variable is not set.",
+            )
+
+        serp_config = search_videos.get("serp_config", {})
+        search_engine_tool = SerpAPI(
+            api_key=self.api_key,
+            base_url=serp_config.get("base_url"),
+            timeout=serp_config.get("timeout", 10)
+        )
+
+        if job_type == "search_videos":
+            if not isinstance(search_videos, dict):
+                return AgentResponse(
+                    status=AgentStatus.ERROR,
+                    message="'search_videos' must be a dictionary.",
+                )
+            if not search_videos:
+                return AgentResponse(
+                    status=AgentStatus.ERROR,
+                    message="Parameters for 'search_videos' are required.",
+                )
+            return self._handle_video_search(search_videos, search_engine_tool)
+        else:
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message=f"Unsupported job type: {job_type}.",
+            )
+
+    def _handle_video_search(self, search_videos: dict, search_engine_tool) -> AgentResponse:
+        """Handles video searches."""
+        query = search_videos.get("query")
+        count = search_videos.get("count", 5)
+        duration = search_videos.get("duration")
+        if not isinstance(count, int) or count < 1 or count > 50:
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message="Count must be between 1 and 50",
+            )
+        if duration and duration not in ["short", "medium", "long"]:
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message=f"Invalid duration value: {duration}",
+            )
+
+        if not query or not isinstance(query, str) or not query.strip():
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message="Search query is required and cannot be empty.",
+            )
+
+        try:
+            results = search_engine_tool.search_videos(query=query, count=count, duration=duration)
+            valid_videos = []
+
+            for video in results:
+                external_url = video.get("link") or video.get("video_link")
+
+                # Skip non-video YouTube links
+                parsed_url = urlparse(external_url)
+                if parsed_url.netloc in ["youtube.com", "www.youtube.com"]:
+                    if any(parsed_url.path.startswith(prefix) for prefix in ["/channel/", "/@", "/c/", "/playlist"]):
+                        continue
+                    if not parsed_url.path.startswith("/watch") or not parse_qs(parsed_url.query).get("v"):
+                        continue
+
+                # Prepare video data
+                video_data = VideoData(
+                    external_url=external_url,
+                    name=video.get("title", "Untitled Video"),
+                    thumbnail_url=video.get("thumbnail"),
+                )
+                valid_videos.append(video_data)
+
+            if not valid_videos:
+                return AgentResponse(
+                    status=AgentStatus.ERROR,
+                    message="No valid videos were found.",
+                )
+
+            videos_content = VideosContent(
+                agent_name=self.agent_name,
+                status=MsgStatus.success,
+                status_message=f"Found {len(valid_videos)} videos.",
+                videos=valid_videos,
+            )
+            self.output_message.content.append(videos_content)
+            self.output_message.push_update()
+
+            return AgentResponse(
+                status=AgentStatus.SUCCESS,
+                message="Video search completed successfully.",
+                data={"videos": [video.dict() for video in valid_videos]},
+            )
+        except requests.exceptions.RequestException as e:
+            error_message = "An error occurred during the video search."
+            if isinstance(e, requests.exceptions.Timeout):
+                error_message = "The search request timed out. Please try again."
+            elif isinstance(e, requests.exceptions.HTTPError):
+                if getattr(e.response, 'status_code', None) == 429:
+                    error_message = "Rate limit exceeded. Please try again in a few minutes."
+                elif getattr(e.response, 'status_code', None) == 401:
+                    error_message = "API authentication failed. Please check your API key."
+            return AgentResponse(
+                status=AgentStatus.ERROR,
+                message=error_message,
+            )
diff --git a/backend/director/core/reasoning.py b/backend/director/core/reasoning.py
@@ -29,18 +29,21 @@
    - Iterate until the request is fully addressed or the user specifies "stop."
 
 2. **Fallback Behavior**:
-   - If `video_id` is unavailable:
-     - Use the `download` agent to retrieve the stream.
-     - Upload the stream to VideoDB to generate a `video_id`.
-     - Proceed with the original request.
+   - If a task requires a `video_id` but one is unavailable:
+     - For stream URLs (m3u8) or external URLs (e.g., YouTube links, direct video links, or videos hosted on other platforms):
+       - Use the `upload` agent to generate a `video_id`.
+       - Immediately proceed with the original task using the newly generated `video_id`.
 
 3. **Identity**:
    - Respond to identity-related queries with: "I am The Director, your AI assistant for video workflows and management."
    - Provide descriptions of all the agents.
 
 4. **Agent Usage**:
-   - Prefer `summary` agent for single-video context unless `search` is explicitly requested.
-   - Use `stream_video` agent for video playback requests.
+   - Always prioritize the appropriate agent for the task:
+     - Use summarize_video for summarization requests unless search is explicitly requested.
+     - For external video URLs, automatically upload and process them if required for further actions (e.g., summarization, indexing, or editing).
+     - Use stream_video for video playback.
+     - Ensure seamless workflows by automatically resolving missing dependencies (e.g., uploading external URLs for a missing video_id) without additional user intervention.
 
 5. **Clarity and Safety**:
    - Confirm with the user if a request is ambiguous.

diff --git a/backend/director/handler.py b/backend/director/handler.py
@@ -23,6 +23,7 @@
 from director.agents.meme_maker import MemeMakerAgent
 from director.agents.composio import ComposioAgent
 from director.agents.comparison import ComparisonAgent
+from director.agents.web_search_agent import WebSearchAgent
 
 
 from director.core.session import Session, InputMessage, MsgStatus
@@ -62,6 +63,7 @@ def __init__(self, db, **kwargs):
             MemeMakerAgent,
             ComposioAgent,
             ComparisonAgent,
+            WebSearchAgent,
         ]
 
     def add_videodb_state(self, session):

diff --git a/backend/director/tools/serp.py b/backend/director/tools/serp.py
@@ -0,0 +1,81 @@
+import requests
+from requests.adapters import HTTPAdapter
+from urllib3.util.retry import Retry
+
+
+class SerpAPI:
+    BASE_URL = "https://serpapi.com/search.json"
+    RETRY_TOTAL = 3
+    RETRY_BACKOFF_FACTOR = 1
+    RETRY_STATUS_CODES = [429, 500, 502, 503, 504]
+
+    def __init__(self, api_key: str, base_url: str = None, timeout: int = 10):
+        """
+        Initialize the SerpAPI client.
+        :param api_key: API key for SerpAPI.
+        :param base_url: Optional base URL for the API.
+        :param timeout: Timeout for API requests in seconds.
+        """
+        if not api_key:
+            raise ValueError("API key is required for SerpAPI.")
+        self.api_key = api_key
+        self.base_url = base_url or self.BASE_URL
+        self.timeout = timeout
+
+        # Configure retries
+        retry_strategy = Retry(
+            total=self.RETRY_TOTAL,
+            backoff_factor=self.RETRY_BACKOFF_FACTOR,
+            status_forcelist=self.RETRY_STATUS_CODES,
+        )
+        self.session = requests.Session()
+        adapter = HTTPAdapter(max_retries=retry_strategy)
+        self.session.mount("https://", adapter)
+
+    def search_videos(self, query: str, count: int, duration: str = None) -> list:
+        if not query or not query.strip():
+            raise ValueError("Search query cannot be empty.")
+        if not isinstance(count, int) or count < 1:
+            raise ValueError("Count must be a positive integer.")
+        """
+        Perform a video search using SerpAPI.
+        :param query: Search query for the video.
+        :param count: Number of video results to retrieve.
+        :param duration: Filter videos by duration (short, medium, long).
+        :return: A list of raw video results from SerpAPI.
+        """
+        params = {
+            "q": query,
+            "tbm": "vid",
+            "num": count,
+            "hl": "en",
+            "gl": "us",
+            "api_key": self.api_key,
+        }
+
+        # Map duration values to SerpAPI's expected format
+        duration_mapping = {
+            "short": "dur:s",
+            "medium": "dur:m",
+            "long": "dur:l",
+        }
+
+        if duration:
+            if duration not in duration_mapping:
+                raise ValueError(f"Invalid duration value: {duration}")
+            params["tbs"] = duration_mapping[duration]
+
+        try:
+            response = self.session.get(self.base_url, params=params, timeout=self.timeout)
+            response.raise_for_status()
+            try:
+                data = response.json()
+            except ValueError as e:
+                raise RuntimeError("Invalid JSON response from SerpAPI") from e
+
+            results = data.get("video_results")
+            if results is None:
+                raise RuntimeError("Unexpected response format: 'video_results' not found")
+            return results
+        except requests.exceptions.RequestException as e:
+            raise RuntimeError(f"Error during SerpAPI video search: {e}") from e