opea-project
diff --git a/‎ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml‎
Lines changed: 0 additions & 1 deletion b/‎ChatQnA/docker_compose/intel/hpu/gaudi/compose.yaml‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎DeepResearchAgent/Dockerfile‎
Lines changed: 2 additions & 2 deletions b/‎DeepResearchAgent/Dockerfile‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎DeepResearchAgent/README.md‎
Lines changed: 7 additions & 4 deletions b/‎DeepResearchAgent/README.md‎
Lines changed: 7 additions & 4 deletions
diff --git a/‎DeepResearchAgent/agent_factory.py‎
Lines changed: 0 additions & 68 deletions b/‎DeepResearchAgent/agent_factory.py‎
Lines changed: 0 additions & 68 deletions
diff --git a/‎DeepResearchAgent/assets/img/opea-deep-research-agent.png‎
52.8 KB b/‎DeepResearchAgent/assets/img/opea-deep-research-agent.png‎
52.8 KB
diff --git a/‎DeepResearchAgent/deep_researcher.yaml‎
Lines changed: 11 additions & 0 deletions b/‎DeepResearchAgent/deep_researcher.yaml‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml‎
Lines changed: 1 addition & 1 deletion b/‎DeepResearchAgent/docker_compose/intel/hpu/gaudi/compose.yaml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh‎
Lines changed: 18 additions & 75 deletions b/‎DeepResearchAgent/docker_compose/intel/hpu/gaudi/set_env.sh‎
Lines changed: 18 additions & 75 deletions
diff --git a/‎DeepResearchAgent/requirements.in‎
Lines changed: 0 additions & 8 deletions b/‎DeepResearchAgent/requirements.in‎
Lines changed: 0 additions & 8 deletions
@@ -109,7 +109,6 @@ services:
       NUM_CARDS: ${NUM_CARDS}
       HF_HUB_OFFLINE: ${HF_HUB_OFFLINE:-0}
       VLLM_TORCH_PROFILER_DIR: "/mnt"
-      VLLM_SKIP_WARMUP: true
     healthcheck:
       test: ["CMD-SHELL", "curl -f http://localhost:80/health || exit 1"]
       interval: 10s
 
@@ -5,9 +5,9 @@ ARG IMAGE_REPO=opea
 ARG BASE_TAG=latest
 FROM opea/comps-base:$BASE_TAG
 
-COPY ./research_agents $HOME/research_agents
+COPY ./deep_researcher.yaml $HOME/deep_researcher.yaml
+COPY ./utils.py $HOME/utils.py
 COPY ./requirements.txt $HOME/requirements.txt
-COPY ./agent_factory.py $HOME/agent_factory.py
 COPY ./research_agent.py $HOME/research_agent.py
 
 USER root
 
@@ -4,15 +4,17 @@ Deep Research Agents are a new class of autonomous AI systems designed to perfor
 
 ## Overview
 
-In this application, we leverage the deep research agent implementation of [langchain-ai/deepagents](https://github.com/langchain-ai/deepagents), and deploy it on the Intel platform with opea microserice.
+In this application, we leverage the deep research agent implementation of [langchain-ai/open_deep_research](https://github.com/langchain-ai/open_deep_research), and deploy it on the Intel platform with OPEA microservices.
 
+![Architecture Overview](assets/img/opea-deep-research-agent.png)
 
 ## Setup Deployment Environment
 
-```shell
+```
+# Configure deep_researcher.yaml with the LLM model that is served by vLLM
+
 # get your TAVILY_API_KEY from https://app.tavily.com/
 export TAVILY_API_KEY=""
-
 # get your HuggingFace Access Token from https://huggingface.co/docs/transformers.js/en/guides/private#step-1-generating-a-user-access-token
 export HF_TOKEN=""
 
@@ -29,8 +31,9 @@ source ./set_env.sh
 
 To deploy the Deep Research Agent services, execute the docker compose up command with the appropriate arguments. For a default deployment, execute:
 
-```shell
+```
 docker compose -f docker_compose/intel/hpu/gaudi/compose.yaml up -d
+
 ```
 
 ## Validate Microservice
 
@@ -0,0 +1,11 @@
+# Copyright (C) 2025 Intel Corporation
+# SPDX-License-Identifier: Apache-2.0
+
+agent:
+  type: langchain_deep_researcher
+  search_api: "tavily"
+  planner_provider: "openai"
+  planner_model: "meta-llama/Llama-3.3-70B-Instruct"
+  writer_provider: "openai"
+  writer_model: "meta-llama/Llama-3.3-70B-Instruct"
+  max_search_depth: 2
@@ -45,7 +45,7 @@ services:
     cap_add:
       - SYS_NICE
     ipc: host
-    command: --model ${LLM_MODEL_ID} --tensor-parallel-size ${NUM_CARDS} --enable-auto-tool-choice --tool-call-parser llama3_json --host 0.0.0.0 --port 8000 --max-seq-len-to-capture $MAX_LEN
+    command: --model ${LLM_MODEL_ID} --tensor-parallel-size ${NUM_CARDS} --host 0.0.0.0 --port 8000 --max-seq-len-to-capture $MAX_LEN
 
   deep-research-agent-server:
     image: ${REGISTRY:-opea}/deep-research-agent:${TAG:-latest}
 
@@ -3,102 +3,45 @@
 # Copyright (C) 2024 Intel Corporation
 # SPDX-License-Identifier: Apache-2.0
 
-# ==============================================================================
-# Environment Configuration for DeepResearchAgent on Intel Gaudi HPU
-# ==============================================================================
-
-# Get the directory where this script is located
+# Navigate to the parent directory and source the environment
 SCRIPT_DIR="$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &> /dev/null && pwd)"
 
-# Source the parent environment configuration file
 pushd "$SCRIPT_DIR/../../../../../" > /dev/null
 source .set_env.sh
 popd > /dev/null
 
-# ------------------------------------------------------------------------------
-# Helper Functions
-# ------------------------------------------------------------------------------
-
-# Validates that a required environment variable is set
+# Function to check if a variable is set
 check_var() {
     local var_name="$1"
     local var_value="${!var_name}"
     if [ -z "${var_value}" ]; then
         echo "Error: ${var_name} is not set. Please set ${var_name}."
-        return 1  # Return error but don't exit to allow other checks to run
+        return 1  # Return an error code but do not exit the script
     fi
 }
 
-# ------------------------------------------------------------------------------
-# Validate Required API Keys
-# ------------------------------------------------------------------------------
-
-check_var "HF_TOKEN"        # HuggingFace token for model access
-check_var "TAVILY_API_KEY"  # Tavily API key for web search functionality
-
-# ------------------------------------------------------------------------------
-# Network Configuration
-# ------------------------------------------------------------------------------
-
-# Detect the primary IP address of the host machine
+# Check critical variables
+check_var "HF_TOKEN"
 export ip_address=$(hostname -I | awk '{print $1}')
-export HOST_IP=${ip_address}
 
-# Update proxy settings to include the host IP
-export no_proxy=${no_proxy},${ip_address}
-export http_proxy=${http_proxy}
-export https_proxy=${https_proxy}
-
-# ------------------------------------------------------------------------------
-# vLLM Service Configuration
-# ------------------------------------------------------------------------------
-
-# Port where vLLM service will be accessible
+# VLLM configuration
 export VLLM_PORT="${VLLM_PORT:-8000}"
-
-# ------------------------------------------------------------------------------
-# Language Model Configuration
-# ------------------------------------------------------------------------------
-
-# LLM model to use for the Deep Research Agent
-# See supported models and tool call parsers at:
-# https://docs.vllm.ai/en/stable/features/tool_calling/#automatic-function-calling
+export VLLM_VOLUME="${VLLM_VOLUME:-/data2/huggingface}"
+export VLLM_IMAGE="${VLLM_IMAGE:-opea/vllm-gaudi:latest}"
 export LLM_MODEL_ID="${LLM_MODEL_ID:-meta-llama/Llama-3.3-70B-Instruct}"
-
-# Parser for handling function/tool calls (must match the model)
-export TOOL_CALL_PARSER="${TOOL_CALL_PARSER:-llama3_json}"
-
-# Maximum sequence length for model context (131072 = ~128K tokens)
 export MAX_LEN="${MAX_LEN:-131072}"
-
-# Number of Gaudi accelerator cards to use
 export NUM_CARDS="${NUM_CARDS:-4}"
-
-# Directory for caching HuggingFace models
 export HF_CACHE_DIR="${HF_CACHE_DIR:-"./data"}"
+export OPENAI_BASE_URL="http://${ip_address}:${VLLM_PORT}/v1"  # follow the configurable vLLM port instead of a fixed 8000
+export OPENAI_API_KEY="empty"
+export no_proxy="${no_proxy:+${no_proxy},}${ip_address}"  # keep requests to the host IP (vLLM endpoint) off the proxy
+export http_proxy=${http_proxy}
+export https_proxy=${https_proxy}
 
-# OpenAI-compatible API endpoint URL for vLLM
-export OPENAI_BASE_URL="http://${ip_address}:${VLLM_PORT}/v1"
-
-# ------------------------------------------------------------------------------
-# API Keys and Authentication
-# ------------------------------------------------------------------------------
-
-export HF_TOKEN="${HF_TOKEN}"              # HuggingFace authentication token
-export OPENAI_API_KEY="empty-api-key"      # Placeholder for vLLM compatibility
-export TAVILY_API_KEY="${TAVILY_API_KEY}"  # Tavily search API key
-
-# ------------------------------------------------------------------------------
-# Deep Research Agent Configuration
-# ------------------------------------------------------------------------------
-
-# Maximum number of research units that can run concurrently
-export MAX_CONCURRENT_RESEARCH_UNITS="${MAX_CONCURRENT_RESEARCH_UNITS:-3}"
 
-# Maximum iterations per researcher before stopping
-export MAX_RESEARCHER_ITERATIONS="${MAX_RESEARCHER_ITERATIONS:-3}"
+# Hugging Face API token
+export HF_TOKEN="${HF_TOKEN}"
 
-# Custom instructions for agent behavior (leave empty for defaults)
-export RESEARCHER_INSTRUCTIONS=""               # Instructions for individual researchers
-export RESEARCH_WORKFLOW_INSTRUCTIONS=""        # Instructions for overall research workflow
-export SUBAGENT_DELEGATION_INSTRUCTIONS=""      # Instructions for task delegation between agents
+# API keys
+check_var "TAVILY_API_KEY"
+export TAVILY_API_KEY="${TAVILY_API_KEY}"