QuesmaOrg
diff --git a/‎.env.template‎
Lines changed: 1 addition & 1 deletion b/‎.env.template‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.pre-commit-config.yaml‎
Lines changed: 50 additions & 0 deletions b/‎.pre-commit-config.yaml‎
Lines changed: 50 additions & 0 deletions
diff --git a/‎CLAUDE.md‎
Lines changed: 26 additions & 18 deletions b/‎CLAUDE.md‎
Lines changed: 26 additions & 18 deletions
diff --git a/‎README.md‎
Lines changed: 28 additions & 14 deletions b/‎README.md‎
Lines changed: 28 additions & 14 deletions
diff --git a/‎__init__.py‎
Lines changed: 1 addition & 1 deletion b/‎__init__.py‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎competition.md‎
Lines changed: 1 addition & 1 deletion b/‎competition.md‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎config.yaml‎
Lines changed: 2 additions & 2 deletions b/‎config.yaml‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎findings/.gitkeep‎
Lines changed: 1 addition & 1 deletion b/‎findings/.gitkeep‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎pyproject.toml‎
Lines changed: 1 addition & 0 deletions b/‎pyproject.toml‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎src/categories/base.py‎
Lines changed: 1 addition & 1 deletion b/‎src/categories/base.py‎
Lines changed: 1 addition & 1 deletion
@@ -1,2 +1,2 @@
 # OpenRouter API Configuration
-OPENROUTER_API_KEY=your_openrouter_api_key_here
+OPENROUTER_API_KEY=your_openrouter_api_key_here
@@ -0,0 +1,50 @@
+# Pre-commit hooks configuration
+# Install: uv tool install pre-commit --with pre-commit-uv
+# Setup: pre-commit install
+#
+# NOTE: These hooks run the same tools as the manual commands (ruff check
+# additionally passes --fix), so results stay consistent with pyproject.toml settings
+
+repos:
+  # uv-specific hooks
+  - repo: https://github.com/astral-sh/uv-pre-commit
+    rev: 0.8.11
+    hooks:
+      - id: uv-lock
+
+  # Run checks in the same order as CI and manual commands
+  # All use 'local' repo to ensure we use exact commands with pyproject.toml settings
+  - repo: local
+    hooks:
+      # 1. Type checking with ty (first)
+      - id: ty-check
+        name: Type check with ty
+        entry: uv run ty check src
+        language: system
+        pass_filenames: false
+        always_run: true
+
+      # 2. Linting with ruff (second) - auto-fixes safe issues
+      - id: ruff-check
+        name: Lint with ruff
+        entry: uv run ruff check src --fix
+        language: system
+        pass_filenames: false
+        always_run: true
+
+      # 3. Formatting with ruff (third) - auto-applies fixes
+      - id: ruff-format
+        name: Format with ruff
+        entry: uv run ruff format src
+        language: system
+        pass_filenames: false
+        always_run: true
+
+  # Minimal but useful file checks
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v5.0.0
+    hooks:
+      - id: check-yaml        # Validate YAML syntax
+      - id: check-json        # Validate JSON syntax
+      - id: check-toml        # Validate TOML syntax (pyproject.toml)
+      - id: check-merge-conflict  # Prevent committing merge markers
@@ -67,24 +67,6 @@ uv run setup
 # Run tests
 uv run pentest
 
-# Run red team attack testing
-uv run attack  # Single attack
-
-# Run adaptive batch campaigns (learns between attempts)
-uv run attack --batch 5  # 5 attempts with learning
-uv run attack --batch 10 --steps 2  # 10 attempts, 2 turns each
-
-# With different attacker models (default: Claude Opus 4.1)
-uv run attack --attacker-model openai/gpt-4o --batch 5
-uv run attack --attacker-model meta-llama/llama-3.1-405b-instruct
-uv run attack --attacker-model google/gemini-2.0-flash-exp
-
-# Use custom prompts
-uv run attack --custom
-
-# View and analyze sessions
-uv run sessions
-
 # Code quality checks (ALWAYS run before committing)
 uv run ty check src       # Type checking first
 uv run ruff check src     # Then linting
@@ -101,6 +83,32 @@ uv run ruff format src    # Finally formatting
 
 If any of these fail, fix the issues before committing. The GitHub Actions CI will run these same checks in this order.
 
+### Pre-Commit Hooks (Automated)
+
+This project uses pre-commit hooks to automatically run checks before each commit.
+
+**Setup (one-time):**
+```bash
+# Install pre-commit with uv plugin for faster Python hook installation
+uv tool install pre-commit --with pre-commit-uv
+
+# Install hooks into git
+pre-commit install
+```
+
+**Manual run (test all files):**
+```bash
+pre-commit run --all-files
+```
+
+The hooks will automatically run on `git commit` and check:
+1. Type checking with `ty` (first)
+2. Linting with `ruff` (second, auto-fixes safe issues)
+3. Formatting with `ruff` (third)
+4. File validation (YAML, JSON, and TOML syntax; merge conflict markers)
+
+Files are checked in the same order as CI: types → lint → format
+
 ### Git Workflow
 
 - Create feature branches for significant changes
 
@@ -6,8 +6,8 @@ A comprehensive security testing framework for the OpenAI GPT-OSS-20B Red Teamin
 
 ## Competition Overview
 
-**Target**: OpenAI's gpt-oss-20b open weight model  
-**Goal**: Find up to 5 distinct vulnerabilities with high Severity, Breadth, Novelty, Reproducibility, and Methodological Insight  
+**Target**: OpenAI's gpt-oss-20b open weight model
+**Goal**: Find up to 5 distinct vulnerabilities with high Severity, Breadth, Novelty, Reproducibility, and Methodological Insight
 **Deadline**: August 26, 2025
 
 ## 🛠️ Getting Started
@@ -50,10 +50,10 @@ A comprehensive security testing framework for the OpenAI GPT-OSS-20B Red Teamin
    # Or test specific categories
    uv run pentest -c deception
    uv run pentest --test-id adderall_001
-   
+
    # Run multi-turn attack testing
    uv run attack
-   
+
    # View and analyze sessions
    uv run sessions
    ```
@@ -65,18 +65,18 @@ A comprehensive security testing framework for the OpenAI GPT-OSS-20B Red Teamin
    ```bash
    # Run single attack (Claude Opus 4.1 default)
    uv run attack
-   
+
    # Run adaptive campaign with multiple attempts
    uv run attack --batch 5  # Run 5 attempts, learning from each
    uv run attack --batch 10 --steps 2  # 10 attempts, each with 2 turns
-   
+
    # Try different attacker models
    uv run attack --attacker-model openai/gpt-4o
    uv run attack --attacker-model meta-llama/llama-3.1-405b-instruct --batch 5
-   
+
    # Use custom prompts instead of AI-generated
    uv run attack --custom
-   
+
    # View and analyze past sessions
    uv run sessions
    ```
@@ -190,7 +190,7 @@ red-team-testbed/
 ├── src/
 │   ├── cli/                    # CLI entry points
 │   │   ├── pentest.py          # Security test runner
-│   │   ├── review.py           # Results evaluation interface  
+│   │   ├── review.py           # Results evaluation interface
 │   │   ├── setup.py            # Environment verification
 │   │   ├── findings.py         # Findings browser and export
 │   │   ├── report.py           # Report generation
@@ -208,7 +208,7 @@ red-team-testbed/
 │   ├── models.py               # Pydantic data models
 │   └── constants.py            # Configuration constants
 ├── findings/                   # Competition submission files
-├── results/                    # Test execution results  
+├── results/                    # Test execution results
 └── pyproject.toml             # Project configuration
 ```
 
@@ -234,7 +234,7 @@ uv run review results/test.json # Review specific file
 uv run findings                 # Browse exported findings
                                 # Use 'e' to export individual competition files
 
-# Generate reports and summaries  
+# Generate reports and summaries
 uv run report                   # Comprehensive analysis report
 ```
 
@@ -443,14 +443,28 @@ uv run ty check src
 
 ### Setting up Pre-commit Hooks
 
-Install pre-commit hooks for automatic checks:
+Pre-commit hooks automatically run type checking, linting, and formatting before each commit:
 
 ```bash
-uv pip install pre-commit
+# Install pre-commit with uv plugin for faster Python hook installation
+uv tool install pre-commit --with pre-commit-uv
+
+# Install hooks into git
 pre-commit install
-pre-commit run --all-files  # Run manually on all files
+
+# Run manually on all files (optional)
+pre-commit run --all-files
 ```
 
+The hooks will automatically:
+1. Type check with `ty` (catches type errors)
+2. Lint and auto-fix with `ruff check --fix` (fixes safe issues)
+3. Format with `ruff format` (ensures consistent style)
+4. Validate YAML, JSON, and TOML files
+5. Check for merge conflicts
+
+All checks use the exact same commands and settings from `pyproject.toml`.
+
 ### Test Coverage
 
 The project aims for high test coverage. Current test suite includes:
 
@@ -5,4 +5,4 @@
 
 __version__ = "1.0.0"
 __author__ = "Red Team Testbed Contributors"
-__description__ = "Red-teaming testbed for OpenAI's GPT-OSS-20B model competition"
+__description__ = "Red-teaming testbed for OpenAI's GPT-OSS-20B model competition"
@@ -106,4 +106,4 @@ This competition represents a significant effort by OpenAI to:
 - Create a structured evaluation process with expert oversight
 - Build a comprehensive understanding of model vulnerabilities
 
-The competition emphasizes finding **novel** vulnerabilities that haven't been previously identified, making original research and creative approaches particularly valuable.
+The competition emphasizes finding **novel** vulnerabilities that haven't been previously identified, making original research and creative approaches particularly valuable.
@@ -35,7 +35,7 @@ categories:
     - evaluation_awareness
     - chain_of_thought
     - best
-  
+
   focus_categories:
     - deception_samples  # Primary focus for initial implementation
     - deception_adderall  # Academic pentesting for medical advice vulnerabilities
@@ -78,4 +78,4 @@ competition:
   max_findings: 5
   team_name: "red-team-testbed"
   export_format: "kaggle"
-  validate_findings: true
+  validate_findings: true
@@ -1,2 +1,2 @@
 # This file ensures the findings directory is tracked in git
-# Exported findings from the CLI UI will be saved here
+# Exported findings from the CLI UI will be saved here
@@ -91,6 +91,7 @@ select = [
 ]
 ignore = [
     "E501",  # line too long - handled by formatter
+    "ANN401",  # Dynamically typed expressions (Any) - needed for flexible test interfaces
 ]
 
 [tool.ruff.lint.isort]
 
@@ -35,7 +35,7 @@ class BaseTest:
 class BaseTester(ABC):
     """Abstract base class for all vulnerability category testers"""
 
-    def __init__(self, client: OllamaClient) -> None:
+    def __init__(self, client: Any) -> None:
         self.client = client
         self.evaluator = ResponseEvaluator()
         self.test_cases = self._initialize_test_cases()
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`# OpenRouter API Configuration`
`2`		`-OPENROUTER_API_KEY=your_openrouter_api_key_here`
	`2`	`+OPENROUTER_API_KEY=your_openrouter_api_key_here`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`# This file ensures the findings directory is tracked in git`
`2`		`-# Exported findings from the CLI UI will be saved here`
	`2`	`+# Exported findings from the CLI UI will be saved here`
Original file line number	Diff line number	Diff line change
`@@ -91,6 +91,7 @@ select = [`
`91`	`91`	`]`
`92`	`92`	`ignore = [`
`93`	`93`	`"E501", # line too long - handled by formatter`
	`94`	`+ "ANN401", # Dynamically typed expressions (Any) - needed for flexible test interfaces`
`94`	`95`	`]`
`95`	`96`
`96`	`97`	`[tool.ruff.lint.isort]`