mgifford
diff --git a/.github/workflows/daily-scan.yml
Lines changed: 109 additions & 0 deletions b/.github/workflows/daily-scan.yml
Lines changed: 109 additions & 0 deletions
diff --git a/.gitignore
Lines changed: 2 additions & 0 deletions b/.gitignore
Lines changed: 2 additions & 0 deletions
diff --git a/README.md
Lines changed: 69 additions & 2 deletions b/README.md
Lines changed: 69 additions & 2 deletions
diff --git a/docs/reports/history.json
Lines changed: 5 additions & 0 deletions b/docs/reports/history.json
Lines changed: 5 additions & 0 deletions
diff --git a/docs/reports/index.html
Lines changed: 12 additions & 0 deletions b/docs/reports/index.html
Lines changed: 12 additions & 0 deletions
diff --git a/docs/reports/operations.md
Lines changed: 59 additions & 0 deletions b/docs/reports/operations.md
Lines changed: 59 additions & 0 deletions
diff --git a/kitty-specs/002-daily-dap-quality-benchmarking/tasks/WP01-pipeline-foundation-and-configuration.md
Lines changed: 27 additions & 20 deletions b/kitty-specs/002-daily-dap-quality-benchmarking/tasks/WP01-pipeline-foundation-and-configuration.md
Lines changed: 27 additions & 20 deletions
diff --git a/kitty-specs/002-daily-dap-quality-benchmarking/tasks/WP02-scanner-execution-layer.md
Lines changed: 28 additions & 21 deletions b/kitty-specs/002-daily-dap-quality-benchmarking/tasks/WP02-scanner-execution-layer.md
Lines changed: 28 additions & 21 deletions
@@ -0,0 +1,109 @@
+name: Daily DAP Scan  # runs the scan CLI on a schedule or on manual dispatch
+
+on:
+  schedule:
+    - cron: '17 9 * * *'  # once a day at 09:17 (GitHub evaluates cron in UTC)
+  workflow_dispatch:
+    inputs:
+      run_date:
+        type: string
+        required: false
+        description: 'Optional run date (YYYY-MM-DD)'
+      url_limit:
+        type: string
+        required: false
+        description: 'Optional URL limit override'
+      traffic_window:
+        type: choice
+        required: false
+        default: daily
+        description: 'Traffic window mode (daily|rolling_7d|rolling_30d)'
+        options:
+          - daily
+          - rolling_7d
+          - rolling_30d
+      dry_run:
+        type: boolean
+        required: false
+        default: false
+        description: 'Run in dry-run mode only'
+
+permissions:
+  contents: write  # the job commits and pushes report snapshots
+
+concurrency:
+  group: daily-dap-scan  # all runs of this workflow share one group
+  cancel-in-progress: false  # a newer run waits instead of cancelling the active one
+
+jobs:
+  daily-scan:  # single job: prepare Node, test, run the scan CLI, publish reports
+    runs-on: ubuntu-latest
+    env:  # dispatch inputs exposed to every step; the `||` fallbacks cover runs without inputs
+      NODE_ENV: production
+      RUN_DATE: "${{ inputs.run_date }}"
+      URL_LIMIT: "${{ inputs.url_limit }}"
+      TRAFFIC_WINDOW: "${{ inputs.traffic_window || 'daily' }}"
+      DRY_RUN: "${{ inputs.dry_run || false }}"
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 0  # 0 = fetch full history rather than a shallow clone
+
+      - name: Setup Node
+        uses: actions/setup-node@v4
+        with:
+          cache: npm  # reuse the npm download cache between runs
+          node-version: '20'
+
+      - name: Install dependencies
+        run: npm ci --include=dev  # job-level NODE_ENV=production would otherwise make npm omit devDependencies before the tests run
+
+      - name: Run tests  # gate: the pipeline below only runs when the test suite passes
+        run: npm test
+
+      - name: Run pipeline  # runs the scan CLI and records its exit status as a step output
+        id: pipeline
+        shell: bash
+        run: |
+          set +e  # keep going after a CLI failure so the status can be recorded below
+          ARGS=(--scan-mode mock)  # NOTE(review): scan mode is fixed to mock here - confirm this is intended for scheduled runs
+          [[ -z "$RUN_DATE" ]] || ARGS+=(--date "$RUN_DATE")
+          [[ -z "$URL_LIMIT" ]] || ARGS+=(--limit "$URL_LIMIT")
+          [[ -z "$TRAFFIC_WINDOW" ]] || ARGS+=(--traffic-window "$TRAFFIC_WINDOW")
+          [[ "$DRY_RUN" != "true" ]] || ARGS+=(--dry-run)
+          node src/cli/run-daily-scan.js "${ARGS[@]}"
+          status=$?
+          echo "exit_code=$status" >> "$GITHUB_OUTPUT"
+          exit 0  # always succeed here; later steps branch on the exit_code output instead
+
+      - name: Upload diagnostics artifact  # keeps run output downloadable even when earlier steps failed
+        uses: actions/upload-artifact@v4
+        if: ${{ always() }}
+        with:
+          name: daily-dap-run-artifacts
+          if-no-files-found: warn  # missing paths produce a warning, not a failure
+          path: |
+            artifacts/
+            docs/reports/daily/
+
+      - name: Commit report snapshots  # publishes docs/reports only after a zero exit code and outside dry-run mode
+        if: always() && steps.pipeline.outputs.exit_code == '0' && env.DRY_RUN != 'true'
+        shell: bash
+        run: |
+          git add docs/reports  # stage first: newly created snapshot files are untracked, and an unstaged git diff ignores untracked files
+          if git diff --cached --quiet -- docs/reports; then
+            echo "No report snapshot changes to commit."
+            exit 0
+          fi
+
+          git config user.name "github-actions[bot]"
+          git config user.email "41898282+github-actions[bot]@users.noreply.github.com"
+          git commit -m "chore: publish daily DAP report snapshots"
+          git push
+
+      - name: Fail workflow on pipeline error  # surfaces the exit status that the pipeline step recorded as an output
+        if: ${{ steps.pipeline.outputs.exit_code != '0' }}
+        run: |
+          echo "Pipeline command exited with code ${{ steps.pipeline.outputs.exit_code }}"
+          exit 1
@@ -15,3 +15,5 @@
 .kittify/missions/__pycache__/
 __pycache__/
 *.pyc
+node_modules/
+artifacts/
@@ -1,2 +1,69 @@
-# daily-dap
-A daily scan of the Digital Accessibility Program
+# Daily DAP Quality Benchmarking
+
+Daily DAP benchmarks the quality and accessibility of the most visited U.S. government pages.
+It prioritizes high-traffic pages because regressions on those pages affect the most people seeking public services.
+
+## Why this project exists
+
+Public-facing government websites are critical infrastructure. When heavily used pages have accessibility,
+performance, or usability issues, impact is broad and immediate.
+
+This project provides a daily, repeatable quality signal by:
+
+- pulling top pages from DAP traffic data,
+- scanning those pages with Lighthouse and ScanGov,
+- aggregating quality and impact metrics,
+- publishing dated static reports and trend history.
+
+## DAP and related resources
+
+- Digital Analytics Program (DAP): https://digital.gov/guides/dap/
+- Analytics.USA.gov overview: https://analytics.usa.gov/
+- DAP data endpoint configured in this repo: `src/config/prevalence.yaml`
+- ScanGov (accessibility scanner): https://github.com/GSA/scan-gov
+- Lighthouse: https://developer.chrome.com/docs/lighthouse/overview/
+
+## Current implementation status
+
+- WP01–WP04 are implemented through report payload generation, static rendering, archive writing, and schema contract tests.
+- WP05 will finalize end-to-end CLI orchestration and scheduled CI automation for the full production run.
+
+## Expected end-to-end action (ingest → scan → report)
+
+The intended operator action is:
+
+1. Pull top DAP URLs and page-load counts.
+2. Run Lighthouse + ScanGov scans for each selected URL.
+3. Aggregate scores and accessibility impact estimates.
+4. Generate and publish dated report snapshots under `docs/reports/`.
+
+This workflow is represented by the CLI entrypoint and work package stack:
+
+- Current entrypoint scaffold: `src/cli/run-daily-scan.js`
+- Full orchestration completion target: WP05
+
+## Local development commands
+
+- Install dependencies:
+	- `npm install`
+- Run tests:
+	- `npm test`
+- Run current dry-run pipeline preview:
+	- `npm run dry-run -- --source-file tests/fixtures/dap-sample.json`
+
+## Output locations
+
+- Daily published snapshots: `docs/reports/daily/YYYY-MM-DD/`
+- History index: `docs/reports/history.json`
+- Top-level dashboard page: `docs/reports/index.html`
+
+## Project structure
+
+- `src/config/` configuration schema + prevalence inputs
+- `src/ingest/` DAP source ingestion + normalization
+- `src/scanners/` Lighthouse/ScanGov execution + normalization
+- `src/aggregation/` metrics, impact, and trends
+- `src/publish/` report building, static rendering, archive + manifest
+- `tests/unit/` unit tests
+- `tests/contract/` schema contract validation
+- `kitty-specs/002-daily-dap-quality-benchmarking/` specification and work packages
@@ -0,0 +1,5 @@
+{
+  "generated_at": null,
+  "lookback_days": 30,
+  "entries": []
+}
@@ -0,0 +1,12 @@
+<!doctype html> <!-- Placeholder page for docs/reports: it only states that no reports have been published yet. -->
+<html lang="en">
+<head>
+  <meta charset="utf-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1" />
+  <title>Daily DAP Reports</title>
+</head>
+<body>
+  <h1>Daily DAP Quality Reports</h1>
+  <p>No reports have been published yet.</p>
+</body>
+</html>
@@ -0,0 +1,59 @@
+# Daily DAP Operations Runbook
+
+## Operational goals
+
+- Keep daily report publication continuous and transparent.
+- Preserve artifact diagnostics for every run.
+- Support safe reruns and controlled rollback when publication errors occur.
+
+## Routine execution
+
+- Scheduled execution is handled by `.github/workflows/daily-scan.yml`.
+- Manual rerun is available via workflow dispatch inputs:
+  - `run_date`
+  - `url_limit`
+  - `traffic_window`
+  - `dry_run`
+
+## Local operator commands
+
+- Dry run validation:
+  - `npm run dry-run -- --source-file tests/fixtures/dap-sample.json`
+- Full mock orchestration run:
+  - `node src/cli/run-daily-scan.js --source-file tests/fixtures/dap-sample.json --scan-mode mock`
+- Run a specific date:
+  - `node src/cli/run-daily-scan.js --date 2026-02-21 --scan-mode mock --source-file tests/fixtures/dap-sample.json`
+
+## Failure handling
+
+When a run fails:
+
+- Failure payload is written to `docs/reports/daily/YYYY-MM-DD/report.json`.
+- Failure page is written to `docs/reports/daily/YYYY-MM-DD/index.html`.
+- Diagnostics summary is written to `artifacts/YYYY-MM-DD/run-summary.json`.
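+- The workflow uploads the diagnostics bundle (`artifacts/` and `docs/reports/daily/`) as a GitHub Actions artifact; because the commit step is skipped when the pipeline exits non-zero, failure output is available only from that artifact.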
+
+## Recovery and rollback
+
+1. Inspect latest workflow run logs and uploaded artifact.
+2. Confirm whether failure is environmental (transient) or functional (code/data contract).
+3. For transient failures, rerun workflow dispatch for the same date.
+4. For functional issues, fix on a branch and rerun manually in dry-run mode first.
+5. If a published snapshot is bad, revert only the affected `docs/reports/` paths and rerun the workflow.
+
+## Safe config changes
+
+- Edit `src/config/prevalence.yaml` for:
+  - `scan.url_limit`
+  - `scan.history_lookback_days`
+  - `scan.traffic_window_mode`
+  - impact prevalence rates and severity weights
+- Validate with:
+  - `npm test`
+  - `npm run dry-run -- --source-file tests/fixtures/dap-sample.json`
+
+## Troubleshooting notes
+
+- Scanner execution failures are expected to produce partial reports rather than silent drops.
+- Missing page-load counts are retained for diagnostics and excluded from weighted traffic math.
+- Avoid empty snapshot commits: the workflow already checks for changes under `docs/reports` before committing.
@@ -1,26 +1,29 @@
 ---
-work_package_id: "WP01"
-subtasks:
-  - "T001"
-  - "T002"
-  - "T003"
-  - "T004"
-  - "T005"
-title: "Pipeline Foundation and Configuration"
-phase: "Phase 1 - Foundation"
-lane: "planned"
+work_package_id: WP01
+title: Pipeline Foundation and Configuration
+lane: "done"
 dependencies: []
-assignee: ""
-agent: ""
-shell_pid: ""
-review_status: ""
-reviewed_by: ""
+base_branch: main
+base_commit: 9d3d2a1568d59c415559a214ba0862a372698696
+created_at: '2026-02-21T20:15:30.629111+00:00'
+subtasks:
+- T001
+- T002
+- T003
+- T004
+- T005
+phase: Phase 1 - Foundation
+assignee: ''
+agent: "codex"
+shell_pid: "6888"
+review_status: "approved"
+reviewed_by: "Mike Gifford"
 history:
-  - timestamp: "2026-02-21T20:12:31Z"
-    lane: "planned"
-    agent: "system"
-    shell_pid: ""
-    action: "Prompt generated via /spec-kitty.tasks"
+- timestamp: '2026-02-21T20:12:31Z'
+  lane: planned
+  agent: system
+  shell_pid: ''
+  action: Prompt generated via /spec-kitty.tasks
 ---
 
 # Work Package Prompt: WP01 – Pipeline Foundation and Configuration
@@ -104,3 +107,7 @@ history:
 ## Activity Log
 
 - 2026-02-21T20:12:31Z – system – lane=planned – Prompt generated.
+- 2026-02-21T20:15:30Z – codex – shell_pid=6888 – lane=doing – Assigned agent via workflow command
+- 2026-02-21T20:29:39Z – codex – shell_pid=6888 – lane=for_review – Ready for review: foundation scaffold, config validation, ingest normalization, and tests complete
+- 2026-02-21T20:30:41Z – codex – shell_pid=6888 – lane=doing – Started review via workflow command
+- 2026-02-21T20:36:47Z – codex – shell_pid=6888 – lane=done – Review passed: WP01 foundation implemented cleanly; unit tests pass (8/8); dependency check N/A (none); dependent WP02 remains planned; dependency declarations align with current module coupling and staged architecture.
@@ -1,27 +1,30 @@
 ---
-work_package_id: "WP02"
-subtasks:
-  - "T006"
-  - "T007"
-  - "T008"
-  - "T009"
-  - "T010"
-title: "Scanner Execution Layer"
-phase: "Phase 2 - Data Collection"
-lane: "planned"
+work_package_id: WP02
+title: Scanner Execution Layer
+lane: "done"
 dependencies:
-  - "WP01"
-assignee: ""
-agent: ""
-shell_pid: ""
-review_status: ""
-reviewed_by: ""
+- WP01
+base_branch: 002-daily-dap-quality-benchmarking-WP01
+base_commit: f14ce0e83305e07ec1fbe4db2a5030cff44d6485
+created_at: '2026-02-21T20:37:59.357606+00:00'
+subtasks:
+- T006
+- T007
+- T008
+- T009
+- T010
+phase: Phase 2 - Data Collection
+assignee: ''
+agent: "codex"
+shell_pid: "3570"
+review_status: "approved"
+reviewed_by: "Mike Gifford"
 history:
-  - timestamp: "2026-02-21T20:12:31Z"
-    lane: "planned"
-    agent: "system"
-    shell_pid: ""
-    action: "Prompt generated via /spec-kitty.tasks"
+- timestamp: '2026-02-21T20:12:31Z'
+  lane: planned
+  agent: system
+  shell_pid: ''
+  action: Prompt generated via /spec-kitty.tasks
 ---
 
 # Work Package Prompt: WP02 – Scanner Execution Layer
@@ -106,3 +109,7 @@ history:
 ## Activity Log
 
 - 2026-02-21T20:12:31Z – system – lane=planned – Prompt generated.
+- 2026-02-21T20:37:59Z – codex – shell_pid=6888 – lane=doing – Assigned agent via workflow command
+- 2026-02-21T21:55:08Z – codex – shell_pid=6888 – lane=for_review – Ready for review: implemented T006-T010 scanner execution layer (Lighthouse + ScanGov runners, per-URL normalization, bounded retry/timeout execution manager, and status/diagnostics), with unit tests passing (13/13).
+- 2026-02-21T21:57:13Z – codex – shell_pid=3570 – lane=doing – Started review via workflow command
+- 2026-02-21T21:58:31Z – codex – shell_pid=3570 – lane=done – Review passed: WP02 scanner execution layer satisfies T006-T010; tests pass (13/13); dependency WP01 is on main; dependent WP03 is planned; dependency declarations match staged coupling boundaries.