skills/.github/workflows/skillspector.yml at 40e8397bd842f879927626e14cae76af9d7e23e1 · amd/skills · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
name: skillspector

# Statically scan skills under skills/ with SkillSpector to catch malicious
# patterns and security risks before they land on main. LLM semantic analysis
# is intentionally disabled (--no-llm): the scan is fully static, needs no API
# key, and runs in an isolated environment via uvx.
#
# To avoid re-scanning the entire catalog on every change, the discovery job
# only selects the skills that actually changed in the diff. When the scanning
# machinery itself changes (this workflow, the gate, or the allowlist) we scan
# every skill instead -- see .github/scripts/changed_skills.py.
#
# Mirrors the discover-matrix-aggregate shape of validate.yml so each skill is
# scanned independently and a single aggregate check (the `skillspector` job)
# rolls them up.
#
# This workflow is ADVISORY ONLY: SkillSpector findings never fail CI. Each
# changed skill with un-allowlisted HIGH/CRITICAL findings (or a tool error)
# raises a ::warning:: annotation plus a job-summary entry so reviewers are
# alerted that action is needed, without blocking the merge. Keep this check
# non-required in branch protection to preserve that behavior.

on:
  push:
    branches: [main]
  pull_request:
    # Keep this in sync with INFRA_PATHS in changed_skills.py: any path here
    # that isn't a skill forces a full re-scan of every skill when it changes.
    paths:
      - "skills/**"
      - ".github/workflows/skillspector.yml"
      - ".github/scripts/changed_skills.py"
      - ".github/scripts/skillspector_gate.py"
      - ".github/skillspector-allow.yml"
  workflow_dispatch:

permissions:
  contents: read

jobs:
  # Enumerate the skills the scan job should fan out over. Instead of always
  # listing every skill, select only the ones that changed relative to the
  # diff base (or all skills when the scanning machinery itself changed). The
  # resulting JSON array may be empty, in which case scan-skill is skipped.
  discover-skills:
    name: Discover skills
    runs-on: ubuntu-latest
    outputs:
      skills: ${{ steps.discover.outputs.skills }}
    steps:
      - name: Check out repository
        uses: actions/checkout@v4
        with:
          # Need history so we can diff against the base ref below.
          fetch-depth: 0

      - name: Set up uv
        uses: astral-sh/setup-uv@v7

      # On pull_request, diff against the PR base; on push, diff against the
      # commit we pushed over; otherwise (manual run) leave it empty so the
      # script falls back to scanning every skill.
      - name: Determine diff base
        id: base
        run: |
          if [ "${{ github.event_name }}" = "pull_request" ]; then
            echo "ref=${{ github.event.pull_request.base.sha }}" >> "$GITHUB_OUTPUT"
          elif [ "${{ github.event_name }}" = "push" ]; then
            echo "ref=${{ github.event.before }}" >> "$GITHUB_OUTPUT"
          else
            echo "ref=" >> "$GITHUB_OUTPUT"
          fi

      - name: Select changed skills
        id: discover
        run: echo "skills=$(uv run .github/scripts/changed_skills.py --base '${{ steps.base.outputs.ref }}')" >> "$GITHUB_OUTPUT"

  scan-skill:
    name: Scan skill
    needs: discover-skills
    runs-on: ubuntu-latest
    strategy:
      # Don't cancel the other skills when one fails; we want to see every
      # skill's scan result in a single run.
      fail-fast: false
      matrix:
        skill: ${{ fromJson(needs.discover-skills.outputs.skills) }}
    steps:
      - name: Check out repository
        uses: actions/checkout@v4

      - name: Set up uv
        uses: astral-sh/setup-uv@v7

      # Run SkillSpector pinned to a specific commit for reproducibility and
      # supply-chain safety. To bump it, update the SHA below to the desired
      # skillspector commit (e.g. `git ls-remote https://github.com/NVIDIA/skillspector.git main`).
      #
      # The CLI exits 1 when a skill's *aggregate* risk score is HIGH/CRITICAL
      # (score > 50) and 2 on error. We don't gate on the aggregate score,
      # because a pile of MEDIUM findings can push the aggregate to HIGH even
      # when no single finding is HIGH/CRITICAL. Instead we evaluate individual
      # HIGH/CRITICAL findings via the gate script.
      #
      # SkillSpector is ADVISORY ONLY: this step never fails the build. When a
      # finding (or a tool error) needs attention we raise a ::warning::
      # annotation and write to the job summary so it shows up on the PR
      # without blocking the merge. Flip the gate back to `exit 1` if you ever
      # want it to be merge-blocking again.
      - name: Scan skill with SkillSpector (advisory)
        run: |
          set +e
          mkdir -p reports
          skill="${{ matrix.skill }}"
          report="reports/${skill}.md"

          uvx --python 3.12 \
            --from "git+https://github.com/NVIDIA/skillspector.git@939da7d41eed4282e4d8217fe2254c69f690027e" \
            skillspector scan "skills/${skill}" \
              --no-llm --format markdown --output "$report"
          scan_code=$?

          echo "----- SkillSpector report: ${skill} -----"
          cat "$report" || true

          # Exit code 2 means SkillSpector itself errored; surface it as a
          # warning but don't fail the build.
          if [ "$scan_code" = "2" ]; then
            echo "::warning title=SkillSpector error::SkillSpector errored while scanning '${skill}' (exit 2) -- review needed."
            {
              echo "### :warning: ${skill}: SkillSpector errored"
              echo "SkillSpector exited 2 (tool error). Re-run the workflow or investigate the step log."
            } >> "$GITHUB_STEP_SUMMARY"
            exit 0
          fi

          # Evaluate individual HIGH/CRITICAL findings, minus documented false
          # positives in .github/skillspector-allow.yml. The gate exits 1 when
          # un-allowlisted HIGH/CRITICAL findings remain; we turn that into an
          # advisory warning rather than a failure.
          uv run .github/scripts/skillspector_gate.py \
            --report "$report" \
            --skill "${skill}" \
            --allowlist .github/skillspector-allow.yml
          gate_code=$?

          if [ "$gate_code" != "0" ]; then
            echo "::warning title=SkillSpector findings::Skill '${skill}' has un-allowlisted HIGH/CRITICAL SkillSpector findings -- action needed (advisory, not blocking)."
            {
              echo "### :warning: ${skill}: action needed"
              echo "SkillSpector flagged un-allowlisted HIGH/CRITICAL findings. Download the \`skillspector-report-${skill}\` artifact or read the step log above, then fix the skill or add a justified entry to \`.github/skillspector-allow.yml\`."
            } >> "$GITHUB_STEP_SUMMARY"
          else
            echo "### :white_check_mark: ${skill}: no un-allowlisted HIGH/CRITICAL findings" >> "$GITHUB_STEP_SUMMARY"
          fi

          # Advisory: always succeed regardless of findings.
          exit 0

      - name: Upload report
        if: always()
        uses: actions/upload-artifact@v4
        with:
          name: skillspector-report-${{ matrix.skill }}
          path: reports/${{ matrix.skill }}.md
          if-no-files-found: warn

  # Single advisory check that aggregates the per-skill matrix. SkillSpector is
  # advisory only, so findings never fail this check -- they surface as
  # ::warning:: annotations and job-summary entries on the run instead. This
  # job goes red ONLY when a scan job genuinely crashed (e.g. runner/setup
  # error), which is an infrastructure problem worth surfacing rather than a
  # skill finding. Keep this check NON-required in branch protection so the
  # advisory nature is preserved.
  #
  # Because matrix jobs run independently under `fail-fast: false`, we inspect
  # the job result explicitly rather than relying on `needs` short-circuiting.
  skillspector:
    name: SkillSpector security scan (advisory)
    needs: scan-skill
    if: always()
    runs-on: ubuntu-latest
    steps:
      - name: Summarize scan results
        run: |
          result="${{ needs.scan-skill.result }}"
          echo "scan-skill result: $result"
          # "skipped" means the matrix was empty -- no changed skills to scan.
          # "success" means every scan ran (findings, if any, were already
          # raised as warnings on those jobs). Anything else is a genuine job
          # crash, not a finding, so we surface it.
          if [ "$result" != "success" ] && [ "$result" != "skipped" ]; then
            echo "::warning title=SkillSpector scan failed to run::A SkillSpector scan job did not complete (result: $result). This is an infrastructure error, not a finding."
            echo "One or more SkillSpector scan jobs failed to run (result: $result)." >&2
            exit 1
          fi
          echo "SkillSpector scans completed. Any findings are reported as warnings on the run summary (advisory only)."