
Commit 0601b42

Shriyansh Agnihotri committed: release: version 0.0.2 🚀
1 parent a9badfb commit 0601b42

File tree: 8 files changed, +249 -120 lines changed


README.md

Lines changed: 8 additions & 0 deletions
@@ -107,6 +107,7 @@ PROJECT_BASE/
 - `--llm-model LLM_MODEL`: Name of the LLM model to be used by the agent (recommended is `gpt-4o`, but it can take others).
 - `--llm-model-api-key LLM_MODEL_API_KEY`: API key for the LLM model, something like `sk-proj-k.......`.
 
+
 #### Running Hercules
 
 After passing all the required parameters, the command to run Hercules should look like this:
@@ -115,6 +116,13 @@ After passing all the required parameters, the command to run Hercules should look like this:
 testzeus-hercules --input-file opt/input/test.feature --output-path opt/output --test-data-path opt/test_data --llm-model gpt-4o --llm-model-api-key sk-proj-k.......
 ```
 
+#### Supported AI Models for TestZeus-Hercules
+- Anthropic Haiku: Compatible with Haiku 3.5 and above.
+- Groq: Supports any version with function calling and coding capabilities.
+- Mistral: Supports any version with function calling and coding capabilities.
+- OpenAI: Fully compatible with GPT-4o and above. Note: OpenAI GPT-4o-mini is not supported.
+- Ollama: Not supported based on current testing.
+
 #### Execution Flow
 
 Upon running the command:
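
The new "Supported AI Models" section suggests the same CLI invocation can target other providers. As a rough sketch only: the exact model identifier and key prefix accepted by `--llm-model` / `--llm-model-api-key` for Anthropic are assumptions here, and provider-specific settings may instead belong in the agents LLM config shown in the next file.

```
# Hypothetical invocation against Anthropic Haiku; the model name and key format
# are assumed for illustration, not taken from this commit.
testzeus-hercules --input-file opt/input/test.feature --output-path opt/output --test-data-path opt/test_data --llm-model claude-3-5-haiku-latest --llm-model-api-key sk-ant-.......
```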

agents_llm_config-example.json

Lines changed: 53 additions & 23 deletions
@@ -4,22 +4,22 @@
       "model_name": "mistral",
       "model_api_key": "",
       "model_base_url": "https://...",
-      "system_prompt": "You are a web automation task planner....",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     },
     "browser_nav_agent": {
       "model_name": "mistral",
       "model_api_key": "",
       "model_base_url": "https://...",
-      "system_prompt": "You will perform web navigation tasks with the functions that you have...\nOnce a task is completed, confirm completion with ##TERMINATE TASK##.",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     }
   },
@@ -47,51 +47,81 @@
       }
     }
   },
-  "llama": {
+  "ollama": {
     "planner_agent": {
-      "model_name": "llama-3.1-70b-versatile",
+      "model_name": "llama3-groq-tool-use",
+      "model_api_key": "",
+      "model_api_type": "ollama",
+      "model_client_host": "http://localhost:11434",
+      "model_native_tool_calls": true,
+      "model_hide_tools": "if_any_run",
+      "llm_config_params": {
+        "cache_seed": null,
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
+      }
+    },
+    "browser_nav_agent": {
+      "model_name": "llama3-groq-tool-use",
+      "model_api_key": "",
+      "model_api_type": "ollama",
+      "model_client_host": "http://localhost:11434",
+      "model_native_tool_calls": true,
+      "model_hide_tools": "if_any_run",
+      "llm_config_params": {
+        "cache_seed": null,
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
+      }
+    }
+  },
+  "groq": {
+    "planner_agent": {
+      "model_name": "llama3-groq-8b-8192-tool-use-preview",
       "model_api_key": "",
       "model_api_type": "groq",
-      "system_prompt": "You are a web automation task planner....",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     },
     "browser_nav_agent": {
-      "model_name": "llama-3.1-70b-versatile",
+      "model_name": "llama3-groq-8b-8192-tool-use-preview",
       "model_api_key": "",
       "model_api_type": "groq",
-      "system_prompt": "You will perform web navigation tasks with the functions that you have...\nOnce a task is completed, confirm completion with ##TERMINATE TASK##.",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     }
   },
   "anthropic": {
     "planner_agent": {
-      "model_name": "claude-3-opus-20240229",
+      "model_name": "claude-3-5-haiku-latest",
       "model_api_key": "",
       "model_api_type": "anthropic",
-      "system_prompt": "You are a web automation task planner....",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     },
     "browser_nav_agent": {
-      "model_name": "claude-3-opus-20240229",
+      "model_name": "claude-3-5-haiku-latest",
       "model_api_key": "",
       "model_api_type": "anthropic",
-      "system_prompt": "You will perform web navigation tasks with the functions that you have...\nOnce a task is completed, confirm completion with ##TERMINATE TASK##.",
       "llm_config_params": {
         "cache_seed": null,
-        "temperature": 0.1,
-        "top_p": 0.1
+        "temperature": 0.0,
+        "top_p": 0.001,
+        "seed": 12345
       }
     }
   }
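
Not part of the commit, but a quick way to sanity-check a config edited from this example and to inspect the new `ollama` section; assumes `python3` and `jq` are available locally (neither is required by the project):

```
# Confirm the edited config is still well-formed JSON
python3 -m json.tool agents_llm_config-example.json > /dev/null && echo "valid JSON"

# Print the sampling parameters this commit standardises on
jq '.ollama.planner_agent.llm_config_params' agents_llm_config-example.json
# should show cache_seed null, temperature 0.0, top_p 0.001 and seed 12345 per this commit
```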
