@@ -11,73 +11,67 @@ class TestAI:
     async def test_llm_basic_call(self, mock_litellm):
         """Test basic LLM call functionality"""
         result = await llm("gpt-4", "Test prompt", 100)
-
+
         # Verify litellm was called correctly
         mock_litellm.assert_called_once_with(
-            "gpt-4",
-            [{"role": "user", "content": "Test prompt"}],
-            max_tokens=100
+            "gpt-4", [{"role": "user", "content": "Test prompt"}], max_tokens=100
         )
-
+
         # Verify response is returned
         assert result == mock_litellm.return_value
-
+
     @pytest.mark.asyncio
     async def test_llm_without_max_tokens(self, mock_litellm):
         """Test LLM call without specifying max tokens"""
         await llm("gpt-4", "Test prompt")
-
+
         mock_litellm.assert_called_once_with(
-            "gpt-4",
-            [{"role": "user", "content": "Test prompt"}],
-            max_tokens=None
+            "gpt-4", [{"role": "user", "content": "Test prompt"}], max_tokens=None
         )
-
+
     @pytest.mark.asyncio
     async def test_ping_model_success(self, mock_litellm):
         """Test successful model ping"""
         # Create a mock console that can be used in the context
         mock_console_instance = MagicMock()
-
+
         result = await ping_model("gpt-4", mock_console_instance)
-
+
         # Verify success
         assert result is True
-
+
         # Verify console output
         mock_console_instance.print.assert_called_once_with("[green]✓[/green] gpt-4")
-
+
         # Verify LLM was called with validation prompt
         mock_litellm.assert_called_once_with(
-            "gpt-4",
-            [{"role": "user", "content": VALIDATION_PROMPT}],
-            max_tokens=1
+            "gpt-4", [{"role": "user", "content": VALIDATION_PROMPT}], max_tokens=1
         )
-
+
     @pytest.mark.asyncio
     async def test_ping_model_failure(self, mock_litellm):
         """Test failed model ping"""
         # Configure mock to raise exception
         mock_litellm.side_effect = Exception("API Error")
         mock_console_instance = MagicMock()
-
+
         result = await ping_model("invalid-model", mock_console_instance)
-
+
         # Verify failure
         assert result is False
-
+
         # Verify error output
         mock_console_instance.print.assert_called_once_with(
             "[red]✗[/red] invalid-model - API Error"
         )
-
+
     @pytest.mark.asyncio
     async def test_bench_model_success(self, mock_litellm, mocker):
         """Test successful benchmark run"""
         # Mock time to control duration measurement
-        mock_time = mocker.patch('tacho.ai.time.time')
+        mock_time = mocker.patch("tacho.ai.time.time")
         mock_time.side_effect = [100.0, 102.5]  # 2.5 second duration
-
+
         # Configure mock response with usage data (no reasoning tokens)
         mock_response = MagicMock()
         mock_usage = MagicMock()
@@ -86,93 +80,75 @@ async def test_bench_model_success(self, mock_litellm, mocker):
         mock_usage.completion_tokens_details = None
         mock_response.usage = mock_usage
         mock_litellm.return_value = mock_response
-
+
         duration, tokens = await bench_model("gpt-4", 500)
-
+
         # Verify results
         assert duration == 2.5
         assert tokens == 150
-
+
         # Verify LLM was called correctly
         mock_litellm.assert_called_once_with(
-            "gpt-4",
-            [{"role": "user", "content": BENCHMARK_PROMPT}],
-            max_tokens=500
+            "gpt-4", [{"role": "user", "content": BENCHMARK_PROMPT}], max_tokens=500
         )
-
-    @pytest.mark.asyncio
-    async def test_bench_model_no_usage_data(self, mock_litellm, mocker):
-        """Test benchmark when response has no usage data"""
-        # Mock time
-        mock_time = mocker.patch('tacho.ai.time.time')
-        mock_time.side_effect = [100.0, 101.0]
-
-        # Configure mock response without usage
-        mock_response = MagicMock()
-        mock_response.usage = None
-        mock_litellm.return_value = mock_response
-
-        duration, tokens = await bench_model("gpt-4", 500)
-
-        # Should return 0 tokens when no usage data
-        assert duration == 1.0
-        assert tokens == 0
-
+
     @pytest.mark.asyncio
     async def test_bench_model_exception_handling(self, mock_litellm):
         """Test that exceptions propagate from bench_model"""
         mock_litellm.side_effect = Exception("Network error")
-
+
         with pytest.raises(Exception, match="Network error"):
             await bench_model("gpt-4", 500)
-
+
     @pytest.mark.asyncio
     async def test_bench_model_with_reasoning_tokens(self, mock_litellm, mocker):
         """Test benchmark with reasoning models that have completion_tokens_details"""
         # Mock time
-        mock_time = mocker.patch('tacho.ai.time.time')
+        mock_time = mocker.patch("tacho.ai.time.time")
         mock_time.side_effect = [100.0, 103.0]  # 3 second duration
-
+
         # Configure mock response with reasoning tokens
         mock_response = MagicMock()
         mock_response.usage.completion_tokens = 50  # Regular completion tokens
-
+
         # Mock completion_tokens_details with reasoning_tokens
         mock_details = MagicMock()
         mock_details.reasoning_tokens = 200  # Reasoning tokens
         mock_response.usage.completion_tokens_details = mock_details
-
+
         mock_litellm.return_value = mock_response
-
+
         duration, tokens = await bench_model("o1-mini", 500)
-
+
         # Verify results - should include both completion and reasoning tokens
         assert duration == 3.0
         assert tokens == 250  # 50 completion + 200 reasoning
-
+
         # Verify LLM was called correctly
         mock_litellm.assert_called_once_with(
-            "o1-mini",
-            [{"role": "user", "content": BENCHMARK_PROMPT}],
-            max_tokens=500
+            "o1-mini", [{"role": "user", "content": BENCHMARK_PROMPT}], max_tokens=500
         )
-
+
     @pytest.mark.asyncio
-    async def test_bench_model_with_empty_completion_details(self, mock_litellm, mocker):
+    async def test_bench_model_with_empty_completion_details(
+        self, mock_litellm, mocker
+    ):
         """Test benchmark when completion_tokens_details exists but has no reasoning_tokens"""
         # Mock time
-        mock_time = mocker.patch('tacho.ai.time.time')
+        mock_time = mocker.patch("tacho.ai.time.time")
         mock_time.side_effect = [100.0, 102.0]
-
+
         # Configure mock response with completion_tokens_details but no reasoning_tokens
         mock_response = MagicMock()
         mock_response.usage.completion_tokens = 100
-        mock_response.usage.completion_tokens_details = MagicMock(spec=[])  # No reasoning_tokens attribute
-
+        mock_response.usage.completion_tokens_details = MagicMock(
+            spec=[]
+        )  # No reasoning_tokens attribute
+
         mock_litellm.return_value = mock_response
-
+
         duration, tokens = await bench_model("gpt-4", 500)
-
+
         # Should only count regular completion tokens
         assert duration == 2.0
-        assert tokens == 100
+        assert tokens == 100
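
For reference, the assertions in this diff largely pin down the observable behavior of the three functions under test: `llm` forwards a single user message to litellm with an optional `max_tokens`, `ping_model` issues a one-token call with `VALIDATION_PROMPT` and prints a green check or a red cross on the console, and `bench_model` times a `BENCHMARK_PROMPT` call and adds any `reasoning_tokens` from `completion_tokens_details` to the completion-token count. The sketch below is a hypothetical reconstruction consistent with those assertions, not the actual `tacho/ai.py`; in particular, `litellm.acompletion` as the patched call and the placeholder prompt constants are assumptions.

```python
# Hypothetical sketch of tacho/ai.py, inferred only from the tests above --
# the real module may differ in naming and details.
import time

from litellm import acompletion  # assumed to be the call patched as mock_litellm

VALIDATION_PROMPT = "..."  # the real prompt strings live in the actual module
BENCHMARK_PROMPT = "..."


async def llm(model: str, prompt: str, max_tokens: int | None = None):
    # Wrap the prompt as a single user message and forward the token cap.
    return await acompletion(
        model, [{"role": "user", "content": prompt}], max_tokens=max_tokens
    )


async def ping_model(model: str, console) -> bool:
    # One-token validation call; report success or failure on the console.
    try:
        await llm(model, VALIDATION_PROMPT, 1)
        console.print(f"[green]✓[/green] {model}")
        return True
    except Exception as e:
        console.print(f"[red]✗[/red] {model} - {e}")
        return False


async def bench_model(model: str, max_tokens: int) -> tuple[float, int]:
    # Time the benchmark call and count generated tokens, including any
    # reasoning tokens reported by reasoning models (e.g. o1-mini).
    start = time.time()
    response = await llm(model, BENCHMARK_PROMPT, max_tokens)
    duration = time.time() - start

    tokens = response.usage.completion_tokens
    details = response.usage.completion_tokens_details
    if details is not None and getattr(details, "reasoning_tokens", None):
        tokens += details.reasoning_tokens
    return duration, tokens
```

Using `getattr` with a default mirrors the `MagicMock(spec=[])` case above, where `completion_tokens_details` exists but carries no `reasoning_tokens` attribute.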