up

mitchross · mitchross · commit 277ae9d3b47d · 2026-02-24T01:21:25.000-05:00
diff --git a/docs/vpa-resource-optimization.md b/docs/vpa-resource-optimization.md
@@ -2,6 +2,60 @@
 
 How to use VPA, Goldilocks, and Kyverno to right-size Kubernetes resource requests based on actual workload behavior.
 
+## TL;DR — Just Tell Me What To Do
+
+**Everything is automatic.** VPA is already watching every workload in the cluster. You don't need to set anything up.
+
+### Step 1: Open the dashboard
+
+Go to **https://goldilocks.vanillax.me** in your browser (must be on LAN/VPN).
+
+### Step 2: Pick a namespace
+
+Click any namespace (e.g., `argocd`, `immich`, `home-assistant`). You'll see every workload with its current resource settings and what VPA recommends.
+
+### Step 3: Look for problems
+
+The dashboard shows color-coded recommendations. Look for:
+- **Current request way below "Target"** = pod is starved, increase it
+- **Current request way above "Target"** = wasting resources, decrease it
+- **Current request below "Lower Bound"** = request is too small for the workload to run reliably (CPU starvation or out-of-memory risk), fix ASAP
+
+### Step 4: Apply changes
+
+Edit the app's `values.yaml` in Git, update the `resources:` block, and push; ArgoCD then applies the change. Add a comment explaining why:
+
+```yaml
+# VPA-optimized (2026-02-24) — target was 2000m, previous 500m
+resources:
+  requests:
+    cpu: 2000m
+    memory: 1Gi
+```
+
+### Step 5: Wait and re-check
+
+VPA recommendations update continuously. Check back in a week to see if the new values are good. Don't change things daily.
+
+### Quick script to see all recommendations
+
+```bash
+# Full report with human-readable values and action guidance
+./scripts/vpa-report.sh
+
+# Filter to one namespace
+./scripts/vpa-report.sh argocd
+
+# Or raw kubectl one-liner (shows only the first container of each VPA)
+kubectl get vpa -A -o custom-columns=\
+NS:.metadata.namespace,\
+NAME:.metadata.name,\
+CPU:.status.recommendation.containerRecommendations[0].target.cpu,\
+MEM:.status.recommendation.containerRecommendations[0].target.memory
+```
+
+---
+
 ## The Toolchain
 
 | Tool | What It Does | Location |
diff --git a/scripts/vpa-report.sh b/scripts/vpa-report.sh
@@ -0,0 +1,127 @@
+#!/bin/bash
+# vpa-report.sh — Show VPA recommendations (target and lower/upper bounds) per container
+# Usage: ./scripts/vpa-report.sh [namespace]
+# If no namespace given, shows all namespaces
+
+set -euo pipefail
+
+# Scope of the query: a single namespace when one is passed as the first
+# argument, otherwise every namespace. The flags are kept in an array so the
+# namespace reaches kubectl as one properly quoted word instead of relying on
+# word-splitting of an unquoted string.
+NS_ARGS=(-A)
+if [[ -n "${1:-}" ]]; then
+  NS_ARGS=(-n "$1")
+fi
+
+echo "=========================================="
+echo "  VPA Resource Recommendations Report"
+echo "=========================================="
+echo ""
+
+# Fetch the VPA objects as JSON and pipe them into the inline Python formatter.
+# kubectl's stderr is left visible so connection, RBAC, or missing-CRD errors
+# are shown to the user instead of being silently discarded.
+kubectl get vpa "${NS_ARGS[@]}" -o json | python3 -c "
+import json, sys
+
+def bytes_to_human(b):
+    \"\"\"Render a memory quantity in binary units (Ki / Mi / Gi).
+
+    Accepts a plain byte count ('268435456') as well as a quantity carrying a
+    decimal (k, M, G, T) or binary (Ki, Mi, Gi, Ti) suffix such as '262144k',
+    a form Kubernetes uses when serializing quantities. Anything that cannot
+    be parsed is returned unchanged as a string.
+    \"\"\"
+    suffixes = (
+        ('Ki', 1024), ('Mi', 1024 ** 2), ('Gi', 1024 ** 3), ('Ti', 1024 ** 4),
+        ('k', 1000), ('M', 1000 ** 2), ('G', 1000 ** 3), ('T', 1000 ** 4),
+    )
+    try:
+        n = int(b)
+    except (ValueError, TypeError):
+        # Not a bare integer: try to interpret a trailing unit suffix.
+        text = str(b)
+        for suffix, factor in suffixes:
+            if text.endswith(suffix):
+                try:
+                    n = int(text[:-len(suffix)]) * factor
+                except ValueError:
+                    return text
+                break
+        else:
+            return text
+    if n >= 1073741824:
+        return f'{n/1073741824:.1f}Gi'
+    elif n >= 1048576:
+        return f'{n/1048576:.0f}Mi'
+    elif n >= 1024:
+        return f'{n/1024:.0f}Ki'
+    return str(n)
+
+def cpu_to_milli(cpu):
+    \"\"\"Normalize a CPU quantity to a millicore string such as '250m'.
+
+    None yields '?', values already ending in 'm' pass through unchanged, and
+    core counts ('2', '0.5') are multiplied by 1000. Input that cannot be
+    parsed as a number is returned as-is.
+    \"\"\"
+    if cpu is None:
+        return '?'
+    s = str(cpu)
+    if s.endswith('m'):
+        return s
+    try:
+        # round() rather than int(): binary floating point can land just below
+        # the intended value (1.001 * 1000 == 1000.9999999999999), and
+        # truncating would then under-report by one millicore.
+        return f'{round(float(s) * 1000)}m'
+    except ValueError:
+        return s
+
+# Parse the VPA list that kubectl pipes in on stdin. Empty or non-JSON input
+# means kubectl itself failed, so say so instead of dying with a traceback.
+try:
+    data = json.load(sys.stdin)
+except ValueError:
+    print('ERROR: kubectl returned no valid JSON (is the cluster reachable and the VPA CRD installed?)', file=sys.stderr)
+    sys.exit(1)
+
+items = data.get('items', [])
+
+if not items:
+    print('No VPA resources found.')
+    sys.exit(0)
+
+# Collect one row per recommended container. A VPA that has no recommendation
+# yet contributes a single placeholder row and is counted separately so the
+# summary line does not overstate how many recommendations exist.
+results = []
+pending = 0
+for vpa in items:
+    ns = vpa['metadata']['namespace']
+    name = vpa['metadata']['name']
+    target_kind = vpa.get('spec', {}).get('targetRef', {}).get('kind', '?')
+
+    recs = vpa.get('status', {}).get('recommendation', {}).get('containerRecommendations', [])
+    if not recs:
+        pending += 1
+        results.append({
+            'ns': ns, 'name': name, 'kind': target_kind,
+            'container': '-', 'cpu_target': 'waiting...', 'mem_target': 'waiting...',
+            'cpu_lower': '-', 'cpu_upper': '-',
+            'mem_lower': '-', 'mem_upper': '-',
+        })
+        continue
+
+    for rec in recs:
+        target = rec.get('target', {})
+        lower = rec.get('lowerBound', {})
+        upper = rec.get('upperBound', {})
+        results.append({
+            'ns': ns,
+            'name': name,
+            'kind': target_kind,
+            'container': rec.get('containerName', '?'),
+            'cpu_target': cpu_to_milli(target.get('cpu')),
+            'mem_target': bytes_to_human(target.get('memory', '?')),
+            'cpu_lower': cpu_to_milli(lower.get('cpu')),
+            'cpu_upper': cpu_to_milli(upper.get('cpu')),
+            'mem_lower': bytes_to_human(lower.get('memory', '?')),
+            'mem_upper': bytes_to_human(upper.get('memory', '?')),
+        })
+
+# Print table. The range columns are wide enough for values such as
+# 1000m-20000m or 512Mi-16.0Gi and are never truncated: cutting digits off a
+# bound would display a different (wrong) number.
+fmt = '{:<20} {:<35} {:<25} {:>10} {:>19} {:>10} {:>19}'
+header = fmt.format('NAMESPACE', 'WORKLOAD', 'CONTAINER', 'CPU TGT', 'CPU RANGE', 'MEM TGT', 'MEM RANGE')
+print(header)
+print('-' * len(header))
+
+# Sort by namespace then name; the sort is stable, so containers of the same
+# VPA keep the order in which the API returned them.
+results.sort(key=lambda r: (r['ns'], r['name']))
+
+for r in results:
+    workload = r['kind'] + '/' + r['name']
+    cpu_range = r['cpu_lower'] + '-' + r['cpu_upper']
+    mem_range = r['mem_lower'] + '-' + r['mem_upper']
+    print(fmt.format(
+        r['ns'][:20],
+        workload[:35],
+        r['container'][:25],
+        r['cpu_target'],
+        cpu_range,
+        r['mem_target'],
+        mem_range,
+    ))
+
+print()
+print(f'Total: {len(results) - pending} containers with VPA recommendations')
+if pending:
+    print(f'       {pending} VPAs still waiting for a first recommendation')
+print()
+print('Legend:')
+print('  CPU TGT  = recommended CPU request (millicores)')
+print('  MEM TGT  = recommended memory request')
+print('  RANGE    = lowerBound-upperBound')
+print()
+print('Action needed if your current request is:')
+print('  < lowerBound  →  INCREASE NOW (pod is being throttled)')
+print('  < target      →  INCREASE (under-provisioned)')
+print('  ≈ target      →  KEEP (well-tuned)')
+print('  > 2x target   →  DECREASE (over-provisioned)')
+"