basic-llm-agent/llm.py at main · isque03/basic-llm-agent · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
import re
from openai import OpenAI
from ollama import chat
from ollama import ChatResponse
from dotenv import load_dotenv
import os
import logging
from tools import (
    web_search,
    calculator,
    market_data,
    extract_content,
)
from abc import ABC, abstractmethod


class LLMProvider(ABC):
    """Abstract base class for LLM providers."""

    @abstractmethod
    def generate(self, messages, model=None, temperature=0.3):
        """Generate a response from the LLM given messages.

        Args:
            messages: List of message dictionaries with role and content
            model: The model to use
            temperature: Sampling temperature

        Returns:
            The generated text response
        """
        pass


class OpenAIProvider(LLMProvider):
    """OpenAI implementation of LLMProvider."""

    def __init__(self, api_key):
        self.client = OpenAI(api_key=api_key)
        self.default_model = "gpt-4o-mini"

    def generate(self, messages, model=None, temperature=0.1):
        model = model or self.default_model
        response = self.client.chat.completions.create(
            model=model,
            messages=messages,
            temperature=temperature,
        )
        return response.choices[0].message.content.strip()


class OllamaProvider(LLMProvider):
    """Ollama implementation of LLMProvider."""

    def __init__(self):
        self.default_model = "llama3.1"

    def generate(self, messages, model=None, temperature=0.2):
        model = model or self.default_model
        options = {"temperature": temperature, "max_tokens": 300}
        response = chat(model=model, messages=messages, options=options)
        # Extract content from Ollama response based on its API structure
        if isinstance(response, ChatResponse):
            return response.message.content.strip()
        return response["message"]["content"].strip()


class Agent:

    def __init__(self, provider="ollama"):
        # Load environment variables from .env file
        load_dotenv()

        # Set up logging
        logging.basicConfig(level=logging.INFO)
        logging.info("Initializing Agent with provider: %s", provider)

        # Initialize OpenAI API with the API key from environment variables
        self.api_key = os.getenv("OPENAI_API_KEY")
        if not self.api_key and provider == "openai":
            logging.error(
                "API key not found. Please set the OPENAI_API_KEY environment variable."
            )
            raise ValueError("API key is required for OpenAI provider.")

        # load prompt from system_prompt.txt
        with open("system_prompt.md", "r") as file:
            self.system_message = file.read().strip()
        self.messages = []
        self.messages.append({"role": "system", "content": self.system_message})

        # Initialize the appropriate provider
        if provider == "ollama":
            # Note smaller ollama models appear to struggle to follow system instructions
            self.llm_provider = OllamaProvider()
            self.default_model = "llama3.1"
        elif provider == "openai":
            self.llm_provider = OpenAIProvider(api_key=self.api_key)
            self.default_model = "gpt-4o-mini"
        else:
            logging.error("Unsupported provider. Use 'openai' or 'ollama'.")
            raise ValueError("Unsupported provider. Use 'openai' or 'ollama'.")

    def generate_response(self, prompt):
        """Generate a response from the LLM given a prompt."""
        try:
            self.messages.append({"role": "user", "content": str(prompt)})
            response_content = self.llm_provider.generate(
                messages=self.messages, model=self.default_model, temperature=0.3
            )
            self.messages.append({"role": "assistant", "content": response_content})
            return response_content
        except Exception as e:
            logging.error(f"Error generating response: {e}")
            return None


def extract_action(message):
    # Match either "Action: <action>" or "Action Input: <input>"
    action_regex = re.compile("^Action: (.+)$")
    action_input_regex = re.compile("^Action Input: (.+)$")

    lines = message.split("\n")
    action = None
    action_input = None
    for line in lines:
        action_match = action_regex.match(line)
        if action_match:
            action = action_match.group(1).strip()
            continue
        action_input_match = action_input_regex.match(line)
        if action_input_match:
            action_input = action_input_match.group(1).strip()
            continue
    return action, action_input


def parse_action_input_as_parameters(action_input):
    """Parse action input into args and kwargs."""
    if not action_input:
        return [], {}  # Return empty collections instead of None

    import shlex  # For proper shell-like argument parsing
    import ast
    import json

    # check if action_input contains #, if so remove it and everything after it
    if "#" in action_input:
        action_input = action_input.split("#")[0].strip()

    # Handle JSON/dictionary-like inputs
    if action_input.strip().startswith("{") and action_input.strip().endswith("}"):
        try:
            # Parse as JSON
            parsed_dict = json.loads(action_input)

            # If it's a dictionary, convert to kwargs
            if isinstance(parsed_dict, dict):
                return [], parsed_dict
        except json.JSONDecodeError:
            # If JSON parsing fails, continue with normal parsing
            pass

    # Handle special case of simple quoted string (common for web_search)
    if (
        action_input.startswith('"')
        and action_input.endswith('"')
        and action_input.count('"') == 2
    ):
        return [action_input.strip('"')], {}

    # Handle quoted strings and proper tokenization
    try:
        tokens = shlex.split(action_input)
    except ValueError:
        # Fallback if shlex parsing fails
        tokens = action_input.split()

    args = []
    kwargs = {}

    for token in tokens:
        if "=" in token:
            key, value = token.split("=", 1)
            # Try to convert string values to Python types
            try:
                value = ast.literal_eval(value)
            except (ValueError, SyntaxError):
                pass  # Keep as string if conversion fails
            kwargs[key.strip()] = value
        else:
            args.append(token)

    return args, kwargs


def extract_answer(message):
    # Match "Final Answer: <answer>" or "Answer: <answer>"
    answer_regex = re.compile("^(?:Final Answer|Answer): (.+)$")
    lines = message.split("\n")
    for line in lines:
        answer_match = answer_regex.match(line)
        if answer_match:
            return answer_match.group(1).strip()
    return None


def agent_query(user_input, max_turns=20):
    """
    Process a user query through an AI agent with a limited number of interaction turns.
    This function creates an agent instance and handles a conversation loop, allowing
    the agent to generate responses, take actions, and eventually provide an answer.
    Parameters:
    -----------
    user_input : str
      The initial query or prompt from the user.
    max_turns : int, optional
      Maximum number of back-and-forth interactions allowed (default is 15).
    Returns:
    --------
    str or None
      The extracted answer from the agent's final response if successful,
      or None if max_turns is reached without a final answer or if response generation fails.
    Notes:
    ------
    The function relies on several external components:
    - Agent class with a generate_response method
    - extract_action and extract_answer functions to parse responses
    - known_actions dictionary mapping action names to callable functions
    The conversation continues until either:
    1. The agent provides a final answer (no further actions needed)
    2. Maximum number of turns is reached
    3. Response generation fails
    """

    agent = Agent()
    num_turns = 0
    original_input = user_input  # Store the original input

    # Define thresholds for warnings
    warning_threshold = max_turns * 0.6  # Start warning at 60% of max turns
    urgent_threshold = max_turns * 0.8  # Urgent warning at 80% of max turns

    while num_turns < max_turns:
        try:
            num_turns += 1

            # Add turn count warnings as we approach the limit
            current_input = user_input

            if num_turns > urgent_threshold:
                turn_warning = f"\n\nUrgent: You are at turn {num_turns} of {max_turns}. Please provide a final answer immediately as you are about to reach the maximum allowed turns."
                current_input = user_input + turn_warning
                logging.warning(f"Urgent warning: {turn_warning}")
            elif num_turns > warning_threshold:
                turn_warning = f"\n\nNote: You are at turn {num_turns} of {max_turns}. Please start wrapping up your analysis and work toward a final answer soon."
                current_input = user_input + turn_warning
                logging.info(f"Warning: {turn_warning}")

            # Log the turn count
            logging.info(f"Agent interaction - Turn {num_turns}/{max_turns}")

            response = agent.generate_response(current_input)
            print(f"Turn {num_turns}/{max_turns}):")
            logging.info(f"=== START OF RESPONSE ===")
            logging.info(f"{response}")
            logging.info(f"=== END OF RESPONSE ===")

            if not response:
                logging.error("Failed to generate a response from the agent.")
                return None

            action, action_input = extract_action(response)
            answer = extract_answer(response)

            # Return answer if provided
            if answer:
                logging.info(f"Final answer provided after {num_turns} turns")
                return answer

            if action and action in known_actions:
                # Execute the action with the provided input
                args, kwargs = parse_action_input_as_parameters(action_input)
                try:
                    if args or kwargs:
                        result = known_actions[action](*args, **kwargs)
                    else:
                        result = known_actions[action]()
                    logging.info(
                        f"Executed tool action: '{action}' '{action_input}' with result: {str(result)}"
                    )
                    user_input = str(result)
                except Exception as e:
                    logging.error(f"Error executing action {action}: {e}")
                    user_input = f"Error executing {action}: {str(e)}"
            else:
                # If no action is specified but also no answer, remind to provide a final answer
                if not answer and num_turns > warning_threshold:
                    return "No final answer was provided. Based on the analysis so far, please provide your conclusion."
                return extract_answer(response)
        except Exception as e:
            logging.error(f"Error during agent interaction: {e}")
            user_input = f"We encountered an error: {str(e)}\n\nPlease check your tool arguments or continue solving your problem in another way."

    logging.warning(f"Max turns ({max_turns}) reached without a final answer.")
    return "Analysis exceeded maximum allowed turns. Based on the research completed, here is the current conclusion."


known_actions = {
    "web_search": web_search,
    "calculator": calculator,
    "market_data": market_data,
    "extract_content": extract_content,
}

if __name__ == "__main__":

    advanced_user_prompt = """Conduct a detailed analysis of potential stock investments as of March 2025, considering recent improvements in AI agents and thier impact on key econimic indicators. Focus on the following aspects:

    1. **Research Methodology:**
      - Utilize web search tools to identify best practices for conducting thorough company analysis.
      - Learn how to effectively evaluate company financial health, competitive positioning, and growth prospects.

    2. **Company Selection:**
      - Identify publicly traded yet unknown companies that will significantly benefit from recent advancements in AI technology.

    3. **Stock Price Trends:**
      - Collect and analyze stock price data over the past 30 days and 6 months for each selected company. Be sure you have the correct data for the time period.
      - Evaluate whether each company's stock demonstrates favorable trends for investment opportunities (e.g., upward momentum, recovery potential after decline, etc.).

    4. **Recent News and Events:**
      - Summarize recent relevant news articles or events affecting each selected company.
      - Evaluate how these events influence the company’s stock performance and investment potential.

    4. **Investment Recommendation:**
      - Determine if each stock is currently undervalued or overvalued based on the analysis.
      - Assess whether it is a favorable time to buy given current conditions and market sentiment.

    5. **Comprehensive Report:**
      - Present a detailed summary for each analyzed company, including:
        - Recent price trends
        - Impact AI advancements have on the company
        - Significant recent news
        - Final investment assessment and rationale

    5. **Web Research:**
      - Utilize credible financial news websites, market analysis platforms, and official company reports to inform your analysis.

    Provide a final summary highlighting the top recommended stocks for investment, including clear justifications based on your findings.
    """

    simple_user_prompt = (
        "What is the sum of today's high temperature in Paris and Boston?"
    )

    response = agent_query(simple_user_prompt)
    if response:
        print("Assistant:", response)
    else:
        print("Failed to generate a response.")