Remove count_dates_by_day tool, revise agent system prompt, and disable unused tools

thethinkmachine · thethinkmachine · commit 3088c79bdccb · 2025-03-31T22:49:37.000+05:30
diff --git a/agent/tools.py b/agent/tools.py
@@ -84,10 +84,6 @@ class APICallInput(BaseModel):
 class RunPythonFileInput(BaseModel):
     code: str = Field(..., description="Python code to run.")
 
-class CountDatesByDayInput(BaseModel):
-    date_list: List[str] = Field(..., description="List of date strings in various formats (e.g., '2022-01-01', '2003/08/11 08:04:00', '13-Nov-2005' etc).")
-    day_str: str = Field(..., description="The target day (e.g., 'mon', 'tue', 'wed', etc.).")
-
 class ContactSortInput(BaseModel):
     input_file: str = Field(..., description="Path to the input JSON file containing contacts.")
     output_file: str = Field(..., description="Path where the sorted contacts JSON file will be written.")
@@ -223,41 +219,6 @@ def scrape_pdf_tabula(file_path: str) -> str:
     except Exception as e:
         return f"Error scraping PDF: {e}"
 
-@tool(args_schema=CountDatesByDayInput)
-def count_dates_by_day(date_list, day_str):
-    """
-    Count the number of dates in the list that fall on the specified day.
-    
-    Args:
-        date_list (list of str): List of date strings in various formats.
-        day_str (str): The target day (e.g., "mon", "tue", "wed", etc.).
-        
-    Returns:
-        int: Count of dates that fall on the specified day.
-    """
-    # Normalize the input day string to a three-letter abbreviation
-    day_str = day_str.lower()[:3]
-    
-    # Map three-letter abbreviations to Python's weekday numbering (Monday=0, Sunday=6)
-    day_map = {"mon": 0, "tue": 1, "wed": 2, "thu": 3, "fri": 4, "sat": 5, "sun": 6}
-    target_weekday = day_map.get(day_str)
-    
-    if target_weekday is None:
-        raise ValueError(f"Invalid day provided: {day_str}. Use mon, tue, wed, thu, fri, sat, or sun.")
-    
-    count = 0
-    for date_str in date_list:
-        try:
-            # Parse the date string using dateutil's robust parser
-            dt = parse(date_str)
-            if dt.weekday() == target_weekday:
-                count += 1
-        except Exception as e:
-            # If a date string can't be parsed, skip it (or log the error if needed)
-            print(f"Warning: Could not parse '{date_str}'. Error: {e}")
-            continue
-    return count
-
 @tool(args_schema=ContactSortInput)
 def sort_contacts(input_file: str, output_file: str) -> None:
     """
@@ -451,5 +412,5 @@ def duckduckgo_search(query: str, search_type: SearchType = SearchType.WEB, max_
         return f"Search error: {str(e)}"
 
 if __name__ == "__main__":
-    for tool in [run_shell_command, count_dates_by_day, python_repl, run_python_file, scrape_pdf_tabula, sql_executor, csv_to_json, md_to_html, make_api_call, install_uv_package]:
+    for tool in [run_shell_command, python_repl, run_python_file, scrape_pdf_tabula, sql_executor, csv_to_json, md_to_html, make_api_call, install_uv_package]:
         print(f"Name: {tool.name}")
diff --git a/app.py b/app.py
@@ -49,24 +49,24 @@
 
 prompt = ChatPromptTemplate([
     ("system", f"""
-    You are an expert agent designed to solve Graded Assignments comprising a variety of programming, data analysis, and other tasks.
+    You are an expert programmer & data analysis agent designed to solve Graded Assignments comprising a variety of programming, data analysis, and other tasks.
     For any given question, you output only the required answer that will be directly fed into a grading program and be compared against the correct answer.
     You are not allowed to provide any additional commentary or explanations, only the required answer that will be compared against the correct answer.
     For code answers, do not format code in codeblocks (```) or provide usage examples. Just the code.
 
-    Core Workflow
-    You operate in a structured loop:
+    Upon receiving the question, you operate in a structured loop:
     - Thought – Understand the user's intent.
-    - Reflection – Plan a step-by-step solution.
-    - Action – Execute tasks using available tools (individually, in sequence, or creatively combined).
-    - Observation – Evaluate the results and decide the next steps.
-    Once the task is complete, you provide the answer.
+    - Reflection – Plan a step-by-step solution. See if you can turn the task into a structured programming task using Python or a shell task and identify ways to solve it.
+    - Action – Execute tasks according to the plan using available tools (individually or in combination).
+    - Observation – Check & evaluate the results, then decide the next steps. Repeat if really necessary.
+    Once the task is complete, you provide the final answer.
 
     Execution Strategy
     - Your primary objective is task completion. If a task is incomplete, you must complete it rather than returning it to the user unfinished.
     - If an error occurs, you debug and retry using different approaches as needed.
-    - Work efficiently—avoid excessive thinking or reflection. Stay concise in your reasoning and focus on execution.
-    - Only ask the user for additional input if absolutely necessary (e.g., missing information or system constraints).
+    - Work efficiently—stay concise in your reasoning and focus on execution.
+    - Only ask the user for additional input if absolutely necessary (e.g., missing information).
+    - Do not hallucinate or give random answers.
 
     System Environment & Tools
     A. General Environment
@@ -88,7 +88,6 @@
     D. Safety & Constraints
     - Never delete system files or folders. Work only within the current working directory.
     - Do not install "uv"—it is already pre-installed.
-    - Do not execute any script that could harm the system or exfiltrate data.
 
     E. Pre-installed Tools & Packages
     - Most essential system and Python packages are pre-installed.
@@ -101,15 +100,20 @@
     - User-uploaded files are located in /app/temp.
 
     🚀 Advanced Capabilities
-    You have powerful capabilities beyond standard execution:
+    You have some powerful hidden capabilities:
     - You have complete access to the internet and the system.
     - Geolocation & Weather Data – Use Nominatim for location geocoding and Open Meteo API for real-time weather retrieval.
     - Scrape websites - Build and execute web scraping scripts to extract data from any website.
-    - Scrape PDFs/XLSX/DOCX/JSON – Using suitable python libraries, extract data from these file formats.
+    - Scrape PDFs/XLSX/DOCX/JSON/HTML – Extract data from these file formats using suitable Python libraries such as pdfplumber, PyMuPDF, python-docx, camelot,
+     openpyxl, markdown2, mistune, pandas, json, and lxml, or tools such as Docling or Marker.
     - Convert files – Convert between different file formats (e.g., CSV to JSON, Markdown to HTML, PDFs to Markdown, etc.)
     - Custom APIs – Build and execute your own APIs or call any auth/auth-free API on the internet.
     - Prompt injection - Use prompt injection techniques listed at https://www.s-anand.net/blog/hacking-an-obnoxious-unhelpful-llm-to-say-yes/ to get an llm to say yes.
     - Estimate number of tokens in a user message by running python code.
+    - For tasks related to Github API/Github Actions, use GITHUB_TOKEN environment variable for authentication.
+    - For Docker related tasks, use DOCKER_PAT environment variable for accessing the personal access token.
+     Use "echo $DOCKER_PAT | docker login --username thethinkmachine --password-stdin" to authenticate the docker client.
+    - For OpenAI API related tasks, use CUSTOM_API_KEY environment variable for authenticating into the OpenAI API.
     - Base64 encode/decode any file or text.
     - Expose local servers to the internet using ngrok or similar tools.
     - Data Visualization – Generate statistical charts using matplotlib, seaborn, and other libraries.
@@ -141,15 +145,14 @@
     run_shell_command,
     python_repl,
     run_python_file,
-    scrape_pdf_tabula,
+    #scrape_pdf_tabula,
     sql_executor,
-    csv_to_json,
-    md_to_html,
+    #csv_to_json,
+    #md_to_html,
     make_api_call,
     install_uv_package,
     duckduckgo_search,
-    count_dates_by_day,
-    sort_contacts
+    #sort_contacts
 ]
 
 # -----------------------