KasarLabs
diff --git a/‎.gitignore‎
Lines changed: 3 additions & 0 deletions b/‎.gitignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎.smithers/agents.ts‎
Lines changed: 32 additions & 0 deletions b/‎.smithers/agents.ts‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎.smithers/config.ts‎
Lines changed: 8 additions & 0 deletions b/‎.smithers/config.ts‎
Lines changed: 8 additions & 0 deletions
diff --git a/‎.smithers/preload.ts‎
Lines changed: 2 additions & 0 deletions b/‎.smithers/preload.ts‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎.smithers/prompts/final-review.mdx‎
Lines changed: 38 additions & 0 deletions b/‎.smithers/prompts/final-review.mdx‎
Lines changed: 38 additions & 0 deletions
diff --git a/‎.smithers/prompts/plan.mdx‎
Lines changed: 32 additions & 0 deletions b/‎.smithers/prompts/plan.mdx‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎.smithers/prompts/review.mdx‎
Lines changed: 44 additions & 0 deletions b/‎.smithers/prompts/review.mdx‎
Lines changed: 44 additions & 0 deletions
diff --git a/‎.smithers/schemas.ts‎
Lines changed: 55 additions & 0 deletions b/‎.smithers/schemas.ts‎
Lines changed: 55 additions & 0 deletions
diff --git a/‎.smithers/workflow.db‎
-172 KB b/‎.smithers/workflow.db‎
-172 KB
diff --git a/‎.smithers/workflow.db-shm‎
32 KB b/‎.smithers/workflow.db-shm‎
32 KB
@@ -51,3 +51,6 @@ fixtures/runner_crate/target
 .snfoundry_cache
 
 python/starklings_results/
+# Smithers runtime state: SQLite databases and their sidecar files (e.g. -shm)
+smithers.db*
+.smithers/workflow.db*
@@ -0,0 +1,32 @@
+import { ClaudeCodeAgent, CodexAgent } from "smithers-orchestrator";
+import { REPO_ROOT } from "./config";
+
+const SYSTEM_PROMPT_BASE = `You are working on Cairo Coder, a RAG-based Cairo code generation service.
+Stack: Python/FastAPI backend, DSPy for LLM orchestration, PostgreSQL/pgvector.
+Package manager: uv (NEVER pip/poetry).
+Read CLAUDE.md for full project conventions before making any changes.
+
+CRITICAL OUTPUT REQUIREMENT:
+When you have completed your work, you MUST end your response with a JSON object
+wrapped in a code fence. The JSON format is specified in your task prompt.`; // Base system prompt shared verbatim by the planner, implementer and reviewer agents in this file.
+
+export const planner = new ClaudeCodeAgent({ // Claude Code agent exported as `planner`; presumably drives the plan step — confirm against the workflow definition.
+  model: "opus",
+  systemPrompt: SYSTEM_PROMPT_BASE, // same base prompt as the other agents
+  cwd: REPO_ROOT, // working directory comes from ./config (process.cwd() at load time)
+  permissionMode: "default", // NOTE(review): same permission mode as `reviewer`; exact semantics are defined by smithers-orchestrator
+});
+
+export const implementer = new CodexAgent({ // Codex agent exported as `implementer`; the only agent here that is not a ClaudeCodeAgent.
+  model: "gpt-5.3-codex",
+  dangerouslyBypassApprovalsAndSandbox: true, // NOTE(review): the flag name indicates approvals and sandboxing are skipped — confirm this only runs in a trusted, isolated checkout
+  systemPrompt: SYSTEM_PROMPT_BASE, // same base prompt as the other agents
+  cwd: REPO_ROOT, // working directory comes from ./config (process.cwd() at load time)
+});
+
+export const reviewer = new ClaudeCodeAgent({ // Claude Code agent exported as `reviewer`; configured with the same options as `planner`.
+  model: "opus",
+  systemPrompt: SYSTEM_PROMPT_BASE, // same base prompt as the other agents
+  cwd: REPO_ROOT, // working directory comes from ./config (process.cwd() at load time)
+  permissionMode: "default", // NOTE(review): exact semantics are defined by smithers-orchestrator
+});
@@ -0,0 +1,8 @@
+export const MAX_PASSES = 5; // presumably the upper bound on workflow passes — usage is not visible here; confirm against the workflow file
+
+export const REPO_ROOT = process.cwd(); // captured once at module load; agents.ts passes it as `cwd`, so the orchestrator must be launched from the repository root
+
+export const VERIFICATION_COMMANDS = { // shell commands for verification; the same two commands are written out literally in the review prompts
+  test: "cd python && uv run pytest -v", // changes into python/ before running pytest through uv
+  lint: "trunk check --fix", // `--fix` means this command may modify files, not only report
+} as const; // `as const` keeps the keys readonly and the values as string-literal types
@@ -0,0 +1,2 @@
+import { mdxPlugin } from "smithers-orchestrator/mdx-plugin";
+mdxPlugin(); // invoked for its side effect at preload time; presumably registers MDX support so the .mdx prompt files can be imported — confirm in smithers-orchestrator docs
@@ -0,0 +1,38 @@
+# Final Review — STRICT GATE — Pass {props.pass}
+
+You are the final quality gate. REFUSE to approve unless ALL criteria are met.
+
+## Completed Tasks
+
+{props.completedTasks || "None"}
+
+## Latest Review
+
+{props.latestReview ?? "No review yet"}
+
+## Verification
+
+Run ALL checks:
+
+```bash
+cd python && uv run pytest -v
+trunk check --fix
+```
+
+## Criteria — ALL must pass
+
+- [ ] ALL tests pass (`uv run pytest` exits 0)
+- [ ] ALL lint/type checks pass (`trunk check` exits 0)
+- [ ] Implementation matches SPEC.md requirements
+- [ ] No dead code left behind (old McpGenerationProgram removed if replaced)
+- [ ] New code has unit tests
+- [ ] DSPy patterns followed correctly
+- [ ] No hardcoded paths or credentials
+
+Set `readyToMoveOn: true` ONLY if you genuinely cannot find ANYTHING to improve.
+
+If `readyToMoveOn: false`, explain exactly what must be fixed — this feeds into the next pass's implement step.
+
+## REQUIRED OUTPUT
+
+{props.schema}
@@ -0,0 +1,32 @@
+# Plan — Pass {props.pass}
+
+You are a senior Python/DSPy architect. Read the spec and examine the codebase to plan the next atomic unit of work.
+
+## Context
+
+- **Spec file:** {props.specPath}
+- **Completed tasks:** {props.completedTasks || "None yet"}
+- **Codebase areas:** `python/src/cairo_coder/dspy/`, `python/src/cairo_coder/core/`, `python/tests/`
+
+{props.previousFeedback ? `## Feedback from Previous Pass\n${props.previousFeedback}` : ""}
+
+## Instructions
+
+1. Read CLAUDE.md for project conventions
+2. Read the spec at {props.specPath}
+3. Examine the codebase — especially the files mentioned in the spec
+4. Identify the NEXT smallest atomic unit of work (one signature, one module, one test file). Size it sensibly — neither too small nor too large — so that each unit forms a logical, self-contained change for reviewers.
+5. Research what exists and what needs to change
+6. Write a detailed implementation prompt
+
+If the SPEC contains _CRITICAL_, _REORIENTATION_, or _STEERING_ sections, follow them and prioritize the tasks they describe. These sections are how we steer the work in the right direction.
+
+## Constraints
+
+- Pick ONE atomic unit, not the entire feature
+- The implementation prompt must be specific enough for another agent to execute without ambiguity
+- List exact file paths for files to create/modify
+
+## REQUIRED OUTPUT
+
+{props.schema}
@@ -0,0 +1,44 @@
+# Review — Pass {props.pass}
+
+You are a senior code reviewer for Cairo Coder, a Python/FastAPI/DSPy project.
+
+## What Changed
+
+**Task:** {props.taskName}
+**Summary:** {props.summary}
+**Files changed:** {JSON.stringify(props.filesChanged ?? [])}
+**Test output:** {props.testOutput ?? "No test output provided"}
+
+## Instructions
+
+1. Read CLAUDE.md for project conventions
+2. Read ALL changed files listed above — do not review blindly
+3. Run verification checks in order:
+
+```bash
+cd python && uv run pytest -v
+trunk check --fix
+```
+
+4. Check for:
+   - Correct DSPy patterns (Signature → Module → factory function)
+   - Type hints on all functions
+   - No hardcoded paths
+   - No duplicated fixtures (all shared fixtures in `tests/conftest.py`)
+   - Async/await for I/O operations
+   - Proper structlog usage
+
+## Decision
+
+Set `lgtm: true` ONLY if:
+
+- ALL tests pass
+- ALL lint/type checks pass
+- Code follows CLAUDE.md conventions
+- No security issues (OWASP top 10)
+
+If ANY check fails, set `lgtm: false` and list every specific issue.
+
+## REQUIRED OUTPUT
+
+{props.schema}
@@ -0,0 +1,55 @@
+import { z } from "zod";
+
+export const PlanSchema = z.object({ // Structured output describing the next task to implement; `taskName` is the field the review prompt shows as "Task".
+  taskName: z.string().describe("Name of the next task to implement"),
+  research: z
+    .string()
+    .describe("What was discovered by examining the codebase"),
+  implementationPrompt: z
+    .string()
+    .describe("Detailed prompt for the implementer"),
+  filesToCreate: z.array(z.string()).describe("Files that need to be created"),
+  filesToModify: z.array(z.string()).describe("Files that need to be modified"),
+  nextSmallestUnit: z
+    .string()
+    .nullable() // the key is required but its value may be null
+    .describe("Next smallest atomic unit after this task"),
+});
+
+export const ImplementSchema = z.object({ // Structured report of an implementation step; `summary`, `filesChanged` and `testOutput` match the props the review prompt renders.
+  summary: z.string().describe("What was implemented"),
+  filesChanged: z
+    .array(z.string())
+    .describe("Files that were created or modified"),
+  testOutput: z.string().describe("Output from running pytest"),
+  commitMessage: z.string().describe("Git commit message for this change"),
+  nextSmallestUnit: z
+    .string()
+    .nullable() // the key is required but its value may be null
+    .describe("Next smallest atomic unit to implement"),
+});
+
+export const ReviewSchema = z.object({ // Structured verdict of a code review; `lgtm` is the flag the review prompt's "Decision" section asks for.
+  lgtm: z.boolean().describe("true ONLY if ALL checks pass"),
+  review: z.string().describe("Summary of the review findings"),
+  issues: z.array(z.string()).describe("Specific issues found"), // an empty array is accepted
+});
+
+export const FixSchema = z.object({ // Structured report of a fix step; presumably produced after a failed review — confirm against the workflow file.
+  summary: z.string().describe("What was fixed"),
+  filesChanged: z.array(z.string()).describe("Files that were modified"),
+});
+
+export const FinalReviewSchema = z.object({ // Structured output of the final gate; `readyToMoveOn` is the flag the final-review prompt asks for.
+  readyToMoveOn: z.boolean().describe("true ONLY if all criteria met"),
+  reasoning: z
+    .string()
+    .describe("Why ready or not ready — feeds back into next pass"),
+  qualityScore: z.number().min(1).max(10).describe("Overall quality score"), // inclusive range 1–10; non-integer values are not rejected
+});
+
+export const PassTrackerSchema = z.object({ // Aggregate record of a run; presumably written once per workflow or pass — usage is not visible here, confirm against the workflow file.
+  totalIterations: z.number(), // any number is accepted; there is no integer or non-negative constraint
+  tasksCompleted: z.array(z.string()), // presumably task names as produced by PlanSchema.taskName — confirm
+  summary: z.string(),
+});
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,2 @@`
	`1`	`+import { mdxPlugin } from "smithers-orchestrator/mdx-plugin";`
	`2`	`+mdxPlugin();`