
Commit e036719

Merge pull request #7 from leopiney/feat/upgrade-ag2-and-swarms
Upgrade ag2 and use swarms agents approach
2 parents 276c3b3 + 600c254 commit e036719

23 files changed (+3672 / -3568 lines)

.gitignore

Lines changed: 3 additions & 1 deletion
@@ -110,5 +110,7 @@ Thumbs.db
 .cursorrules

 # Project-specific
+chroma/
 data/
-output/
+output/
+parsed_docs/

config/config_hume.json

Lines changed: 25 additions & 0 deletions
@@ -0,0 +1,25 @@
+{
+  "show": {
+    "name": "The NeuralNoise Podcast",
+    "about": "A podcast about the future of AI and the impact it will have on our lives. We discuss interesting topics in AI and technology.",
+    "language": "English"
+  },
+  "speakers": {
+    "speaker1": {
+      "name": "Zach",
+      "about": "Zach is a software engineer and the founder of NeuralNoise.",
+      "settings": {
+        "provider": "hume",
+        "voice_id": "dfcdd7c7-8255-4216-9ca7-4d4d7b991fc7"
+      }
+    },
+    "speaker2": {
+      "name": "Emily",
+      "about": "Emily is the co-host of the NeuralNoise podcast, she is energetic, and a product designer.",
+      "settings": {
+        "provider": "hume",
+        "voice_id": "3e90dd7e-de46-448a-b143-10f521f84ac9"
+      }
+    }
+  }
+}
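The new config only adds two Hume voices on top of the existing show/speakers structure. As a quick sanity check, a minimal sketch (assuming the standard json module and the SpeakerSettings model from src/neuralnoise/models.py shown further down in this diff) could validate the speaker blocks before generating an episode:

# Minimal sketch: validate the Hume speaker settings from config_hume.json.
# Assumes SpeakerSettings from src/neuralnoise/models.py (voice_id, provider);
# fields beyond provider and voice_id are not checked here.
import json

from neuralnoise.models import SpeakerSettings

with open("config/config_hume.json", "r", encoding="utf-8") as f:
    config = json.load(f)

for key, speaker in config["speakers"].items():
    settings = SpeakerSettings(**speaker["settings"])
    print(f"{key}: provider={settings.provider}, voice_id={settings.voice_id}")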

poetry.lock

Lines changed: 0 additions & 2455 deletions
This file was deleted.

pyproject.toml

Lines changed: 5 additions & 4 deletions
@@ -1,6 +1,6 @@
 [project]
 name = "neuralnoise"
-version = "1.5.0"
+version = "2.0.1"
 description = "An AI-powered podcast studio that uses multiple AI agents working together."
 authors = [
     { name = "Leonardo Piñeyro", email = "[email protected]" }
@@ -10,7 +10,7 @@ readme = "README.md"
 license = { file = "LICENSE" }

 keywords = [
-    "ai", "podcast", "notebooklm", "autogen", "ai audio generation", "generative ai"
+    "ai", "podcast", "notebooklm", "ag2", "autogen", "ai audio generation", "generative ai"
 ]
 classifiers = [
     "Development Status :: 4 - Beta",
@@ -31,11 +31,12 @@ classifiers = [

 requires-python = ">=3.10,<3.12"
 dependencies = [
-    "ag2>=0.5.2",
+    "ag2[rag]>=0.7.6",
     "backoff>=2.2.1",
     "beautifulsoup4>=4.12.3",
-    "crawl4ai>=0.3.3",
+    "crawl4ai==0.4.0",
     "elevenlabs>=1.10.0",
+    "hume[microphone]>=0.4.2",
     "langchain-community>=0.3.3",
     "lxml>=5.3.0",
     "openai>=1.52.2",

src/neuralnoise/cli.py

Lines changed: 2 additions & 2 deletions
@@ -45,7 +45,7 @@ def generate(
     output_dir = Path("output") / name
     output_dir.mkdir(parents=True, exist_ok=True)

-    content_path = output_dir / "content.txt"
+    content_path = output_dir / "content.md"

     if content_path.exists():
         with open(content_path, "r") as f:
@@ -61,7 +61,7 @@
     typer.secho(f"Extracting content from inputs {input}", fg=typer.colors.YELLOW)
     content = extract_content(input)

-    with open(output_dir / "content.txt", "w") as f:
+    with open(content_path, "w") as f:
         f.write(content)

     typer.secho(f"Generating podcast episode {name}", fg=typer.colors.GREEN)

src/neuralnoise/extract.py

Lines changed: 4 additions & 1 deletion
@@ -136,7 +136,10 @@ async def _extract_multiple_sources(
         *[_extract_single_source(source, use_async=use_async) for source in sources]
     )

-    return "\n\n".join(f"<document>\n{content}\n</document>" for content in contents)
+    return "\n\n".join(
+        f"# Document START: {source}\n\n{content}\n\n# Document END: {source}\n\n"
+        for source, content in zip(sources, contents)
+    )


 # Public API functions
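The extractor now labels each source with plain-text Document START/END markers that include the source identifier, rather than anonymous <document> tags, presumably so content can be attributed to a specific source downstream. A standalone sketch of the resulting joined format, using dummy data rather than the real extraction pipeline:

# Standalone sketch of the new joined-document format (dummy data only).
sources = ["https://example.com/article", "notes.pdf"]
contents = ["First document text.", "Second document text."]

combined = "\n\n".join(
    f"# Document START: {source}\n\n{content}\n\n# Document END: {source}\n\n"
    for source, content in zip(sources, contents)
)
print(combined)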

src/neuralnoise/models.py

Lines changed: 35 additions & 9 deletions
@@ -1,8 +1,8 @@
 from pathlib import Path
 from textwrap import dedent
-from typing import Literal
+from typing import Any, Literal

-from pydantic import BaseModel, Field, field_validator
+from pydantic import BaseModel, Field


 class VoiceSettings(BaseModel):
@@ -15,7 +15,7 @@ class VoiceSettings(BaseModel):
 class SpeakerSettings(BaseModel):
     voice_id: str

-    provider: Literal["elevenlabs", "openai"] = "elevenlabs"
+    provider: Literal["elevenlabs", "openai", "hume"] = "elevenlabs"
     voice_model: Literal["eleven_multilingual_v2", "tts-1", "tts-1-hd"] = (
         "eleven_multilingual_v2"
     )
@@ -97,14 +97,40 @@ class ScriptSegment(BaseModel):
         None, description="Time in seconds for silence after speaking"
     )

-    @field_validator("blank_duration")
-    def validate_blank_duration(cls, v):
-        if v is not None and v not in (0.1, 0.2, 0.5):
-            raise ValueError("blank_duration must be 0.1, 0.2, or 0.5 seconds")
-        return v
-

 class PodcastScript(BaseModel):
     section_id: int
     section_title: str
     segments: list[ScriptSegment]
+
+
+class SharedContext(BaseModel):
+    """Manages shared state for content processing and section management."""
+
+    content_analysis: dict[str, Any] | None = Field(
+        default=None, description="Analysis results of the processed content"
+    )
+    section_scripts: dict[int, dict[str, Any]] = Field(
+        default_factory=dict,
+        description="Mapping of section indices to their associated scripts",
+    )
+    section_feedbacks: dict[int, list[str]] = Field(
+        default_factory=dict,
+        description="Mapping of section indices to their associated feedback",
+    )
+    execution_plans: str = Field(
+        default="",
+        description="Execution plans for the complete podcast, specifying all required sections",
+    )
+    current_section_index: int = Field(
+        default=0, description="Index of the currently active section"
+    )
+    is_complete: bool = Field(
+        default=False, description="Flag indicating if processing is complete"
+    )
+    errors: list[str] = Field(
+        default_factory=list, description="List of errors encountered during processing"
+    )
+    warnings: list[str] = Field(
+        default_factory=list, description="List of warnings generated during processing"
+    )

src/neuralnoise/prompt_manager.py

Lines changed: 145 additions & 0 deletions
@@ -0,0 +1,145 @@
+from enum import Enum, auto
+from pathlib import Path
+from string import Template
+
+
+class PromptType(Enum):
+    """Enumeration of all available prompt types."""
+
+    CONTENT_ANALYZER = auto()
+    PLANNER = auto()
+    SCRIPT_GENERATOR = auto()
+    EDITOR = auto()
+    USER_PROXY = auto()
+    USER_MESSAGE = auto()
+    MANAGER = auto()
+
+
+class PromptManager:
+    """
+    Manages loading and caching of system prompts for the neuralnoise application.
+
+    This class provides a centralized way to load and access prompts from the prompts directory.
+    It loads all prompts during initialization and provides methods to access and substitute
+    variables in the prompts.
+    """
+
+    _instance = None
+
+    def __new__(cls, *args, **kwargs):
+        """Implement singleton pattern to ensure only one instance exists."""
+        if cls._instance is None:
+            cls._instance = super(PromptManager, cls).__new__(cls)
+        return cls._instance
+
+    def __init__(self, prompts_dir: Path | None = None, language: str = "en"):
+        """
+        Initialize the PromptManager with the prompts directory and language.
+
+        Args:
+            prompts_dir: Directory containing prompt files. If None, uses the default package prompts.
+            language: Language code for prompt templates.
+        """
+        # Skip initialization if already initialized
+        if hasattr(self, "_initialized") and self._initialized:
+            return
+
+        self.language = language
+
+        # Set prompts directory
+        if prompts_dir is None:
+            from neuralnoise.utils import package_root
+
+            self.prompts_dir = package_root / "prompts"
+        else:
+            self.prompts_dir = Path(prompts_dir)
+
+        # Map of PromptType to file paths
+        self.prompt_files = {
+            PromptType.CONTENT_ANALYZER: self.prompts_dir
+            / "content_analyzer.system.xml",
+            PromptType.PLANNER: self.prompts_dir / "planner.system.xml",
+            PromptType.SCRIPT_GENERATOR: self.prompts_dir
+            / "script_generation.system.xml",
+            PromptType.EDITOR: self.prompts_dir / "editor.system.xml",
+            PromptType.USER_PROXY: self.prompts_dir / "user_proxy.system.xml",
+            PromptType.USER_MESSAGE: self.prompts_dir / "user_proxy.message.xml",
+            PromptType.MANAGER: self.prompts_dir / "manager.system.xml",
+        }
+
+        # Load all prompts
+        self.prompts: dict[PromptType, str] = {}
+        self._load_all_prompts()
+
+        self._initialized = True
+
+    def _load_all_prompts(self) -> None:
+        """Load all prompts from the prompts directory."""
+        for prompt_type, file_path in self.prompt_files.items():
+            self.prompts[prompt_type] = self._load_prompt_file(file_path)
+
+    def _load_prompt_file(self, path: Path) -> str:
+        """
+        Load a prompt from a file.
+
+        Args:
+            path: Path to the prompt file.
+
+        Returns:
+            The content of the prompt file or an empty string if the file doesn't exist.
+        """
+        if not path.exists():
+            return ""
+
+        with open(path, "r", encoding="utf-8") as f:
+            content = f.read()
+
+        return content
+
+    def get_prompt(self, prompt_type: PromptType, **kwargs) -> str:
+        """
+        Get a prompt with variables substituted.
+
+        Args:
+            prompt_type: Type of prompt to get.
+            **kwargs: Variables to substitute in the prompt.
+
+        Returns:
+            The prompt with variables substituted.
+        """
+        content = self.prompts.get(prompt_type, "")
+
+        # Always include language in kwargs if not provided
+        if "language" not in kwargs:
+            kwargs["language"] = self.language
+
+        if content and kwargs:
+            template = Template(content)
+            content = template.safe_substitute(kwargs)
+
+        return content
+
+    def update_prompt(self, prompt_type: PromptType, **common_kwargs) -> None:
+        """
+        Update a prompt with common variables substituted.
+
+        Args:
+            **common_kwargs: Common variables to substitute in all prompts.
+
+        Returns:
+            Dictionary mapping prompt names to prompt content.
+        """
+        self.prompts[prompt_type] = self.get_prompt(prompt_type, **common_kwargs)
+
+    def update_prompts(self, **common_kwargs) -> None:
+        """
+        Update all prompts with common variables substituted.
+
+        Args:
+            **common_kwargs: Common variables to substitute in all prompts.
+
+        Returns:
+            Dictionary mapping prompt names to prompt content.
+        """
+        for prompt_type in PromptType:
+            self.prompts[prompt_type] = self.get_prompt(prompt_type, **common_kwargs)
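PromptManager is a singleton that loads the XML prompt files once and substitutes ${...} placeholders via string.Template, so typical usage is only a few lines. A hedged sketch (placeholder names other than language depend on what each XML prompt actually declares):

# Sketch: rendering a system prompt through the new PromptManager.
# ${language} is filled in automatically from the manager's language; any other
# ${...} placeholders must match what the XML prompt files actually declare.
from neuralnoise.prompt_manager import PromptManager, PromptType

pm = PromptManager(language="English")
editor_prompt = pm.get_prompt(PromptType.EDITOR)
print(editor_prompt[:200])

# Because of the __new__/_initialized guard, constructing it again returns the
# same instance with the first configuration.
assert PromptManager() is pm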

src/neuralnoise/prompts/content_analyzer.system.xml

Lines changed: 1 addition & 19 deletions
@@ -7,27 +7,9 @@
     <instruction>Remember to create a final section with conclusions and podcast wrap-up.</instruction>
     <instruction>Create sections that cover the main points and arguments of the content.</instruction>
     <instruction>The user will write the content in the XML tag named <![CDATA[ <content> ... </content> ]]></instruction>
-    <instruction>If there are multiple content documents, you'll receive them enclosed individually
-      in an XML tag named <![CDATA[ <document> ... </document> ]]></instruction>
   </instructions>
   <output-format>
-    Provide your analysis in JSON format that conforms to the following TypeScript interface:
-
-    <![CDATA[
-    interface ContentAnalysis {
-      title: string;
-      summary: string;
-      keyPoints: string[];
-      tone: string;
-      targetAudience: string;
-      potentialSegments: {
-        topic: string;
-        duration: number;
-        discussionPoints: string[];
-      }[];
-      controversialTopics: string[];
-    }
-    ]]>
+    Provide your analysis in JSON format that conforms to the ContentAnalysis schema.
   </output-format>
   <language>
     ${language}
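The prompt now defers to "the ContentAnalysis schema" instead of inlining a TypeScript interface. That schema is not shown in this commit, but judging from the removed interface it would presumably be a Pydantic model along these lines (a hypothetical reconstruction; the actual class in the repo may use different field names or nesting):

# Hypothetical Pydantic reconstruction of the ContentAnalysis schema referenced
# by the prompt, mirroring the TypeScript interface removed in this diff.
from pydantic import BaseModel


class PotentialSegment(BaseModel):
    topic: str
    duration: float  # the removed interface only said "number"; units are unspecified
    discussion_points: list[str]


class ContentAnalysis(BaseModel):
    title: str
    summary: str
    key_points: list[str]
    tone: str
    target_audience: str
    potential_segments: list[PotentialSegment]
    controversial_topics: list[str]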

src/neuralnoise/prompts/editor.system.xml

Lines changed: 2 additions & 7 deletions
@@ -6,7 +6,6 @@

   <instructions>
     <instruction>Evaluate structure, depth, transitions, and dialogue naturalness</instruction>
-    <instruction>Limit iterations to 2 per generated section</instruction>
    <instruction>Ensure natural conversation flow</instruction>
     <instruction>Avoid formal introductions/conclusions for sections</instruction>
     <instruction>Encourage quick interactions and questions between speakers</instruction>
@@ -15,21 +14,17 @@
     <instruction>Content flow and engagement: make sure to not talk about the last topic in the the
       introductions. Engage the user introducing the topics slowly</instruction>
     <instruction>Ask the ScriptGeneratorAgent to generate a few more segments with reactions or
-      questions if
-      needed.</instruction>
+      questions if needed.</instruction>
   </instructions>

   <output-format>
     Provide concise editing suggestions.
-    Alternatively, if the script is approved, conclude with 'EDITOR-OK'.
   </output-format>

   <important-notes>
-    <important> Only the EditorAgent can write "EDITOR-OK"</important>
     <important>Focus on the latest script version from the ScriptGeneratorAgent</important>
     <important>If you provide editing suggestions, the ScriptGeneratorAgent will generate a new
-      script based on your suggestions. Don't say EDITOR-OK in this case.</important>
-    <important>PlannerAgent proceeds to the next section after "EDITOR-OK"</important>
+      script based on your suggestions.</important>
   </important-notes>
   <language>
     ${language}
