amd
diff --git a/‎.claude-plugin/marketplace.json‎
Lines changed: 60 additions & 0 deletions b/‎.claude-plugin/marketplace.json‎
Lines changed: 60 additions & 0 deletions
diff --git a/‎.github/ISSUE_TEMPLATE/skill-proposal.yml‎
Lines changed: 1 addition & 1 deletion b/‎.github/ISSUE_TEMPLATE/skill-proposal.yml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/import-external-skills.yml‎
Lines changed: 103 additions & 0 deletions b/‎.github/workflows/import-external-skills.yml‎
Lines changed: 103 additions & 0 deletions
diff --git a/‎CONTRIBUTING.md‎
Lines changed: 2 additions & 2 deletions b/‎CONTRIBUTING.md‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎README.md‎
Lines changed: 19 additions & 11 deletions b/‎README.md‎
Lines changed: 19 additions & 11 deletions
@@ -8,12 +8,36 @@
     "version": "0.1.0"
   },
   "plugins": [
+    {
+      "name": "aiter-reflection",
+      "source": "./skills/aiter-reflection",
+      "skills": "./",
+      "description": "This skill should be used when optimizing AMD GPU kernels on MI300 using the aiter project, including running op tests, benchmarking, iterating on kernel changes, and recording results in the kernel experiment database."
+    },
     {
       "name": "apu-memory-tuner",
       "source": "./skills/apu-memory-tuner",
       "skills": "./",
       "description": "Inspect and tune the shared-vs-dedicated memory split (GTT / UMA Frame Buffer) on AMD Ryzen APUs so larger LLMs and image models fit on the iGPU."
     },
+    {
+      "name": "gpu-architecture-fundamentals",
+      "source": "./skills/gpu-architecture-fundamentals",
+      "skills": "./",
+      "description": "This skill should be used when reasoning about GPU architecture fundamentals to guide kernel optimization choices such as memory hierarchy usage, execution model mapping, block sizing, and latency-aware tuning across HIP, Triton, and PyTorch."
+    },
+    {
+      "name": "hip-kernel-optimization",
+      "source": "./skills/hip-kernel-optimization",
+      "skills": "./",
+      "description": "This skill should be used when writing or tuning HIP kernels on AMD/NVIDIA GPUs, covering memory coalescing, shared-memory tiling, bank conflict avoidance, warp primitives, occupancy, vectorization, async ops, loop unrolling, and profiling."
+    },
+    {
+      "name": "kernel-exp-history",
+      "source": "./skills/kernel-exp-history",
+      "skills": "./",
+      "description": "This skill should be used when optimizing kernels in this repo and needing to consult past optimization experiments, or when recording the current optimization iteration back into the kernel experiment database."
+    },
     {
       "name": "local-ai-app-integration",
       "source": "./skills/local-ai-app-integration",
@@ -26,11 +50,47 @@
       "skills": "./",
       "description": "Route image generation, text-to-speech, and speech-to-text through a local AI Server to reduce token/cost usage."
     },
+    {
+      "name": "mi300-hip-programming-insights",
+      "source": "./skills/mi300-hip-programming-insights",
+      "skills": "./",
+      "description": "CDNA3/MI300 HIP programming insights—chiplet/cache model, Infinity Cache, memory coherency, matrix cores, sparsity, and best practices."
+    },
+    {
+      "name": "pytorch-kernel-optimization",
+      "source": "./skills/pytorch-kernel-optimization",
+      "skills": "./",
+      "description": "This skill should be used when optimizing PyTorch models and kernels, including efficient tensor operations, torch.compile, custom autograd/CUDA/Triton extensions, mixed precision, memory and data pipeline tuning, model optimization techniques, CUDA graphs, and profiling."
+    },
     {
       "name": "rocm-doctor",
       "source": "./skills/rocm-doctor",
       "skills": "./",
       "description": "Diagnose why ROCm, PyTorch, or llama.cpp isn't working on an AMD GPU. Matches the symptom against a fixed list of twelve known misconfigurations and proposes the next step."
+    },
+    {
+      "name": "rocprof-compute",
+      "source": "./skills/rocprof-compute",
+      "skills": "./",
+      "description": "This skill should be used when profiling AMD GPU kernels with rocprof-compute to collect metrics, roofline data, and analyze bottlenecks for HIP kernels."
+    },
+    {
+      "name": "triton-hip-reference-kernel-search",
+      "source": "./skills/triton-hip-reference-kernel-search",
+      "skills": "./",
+      "description": "Search and adapt Triton/HIP kernel patterns from a corpus to optimize AMD GPUs; use to find similar ops and reuse tiling/occupancy strategies."
+    },
+    {
+      "name": "triton-kernel-optimization",
+      "source": "./skills/triton-kernel-optimization",
+      "skills": "./",
+      "description": "This skill should be used when writing or tuning Triton GPU kernels, including autotuning block sizes, coalesced accesses, tiled matmul, fused ops, reductions, flash-attention style kernels, quantization, custom gradients, and profiling."
+    },
+    {
+      "name": "triton-kernel-reflection-prompts",
+      "source": "./skills/triton-kernel-reflection-prompts",
+      "skills": "./",
+      "description": "Reflection/self-critique prompts for reviewing and fixing AMD-targeted Triton kernels after generation or test failures."
     }
   ]
 }
@@ -50,7 +50,7 @@ body:
     id: home
     attributes:
       label: Where should this skill live?
-      description: See the two contribution paths in `CONTRIBUTING.md`. Path A skills are authored under `skills/` in this repo; Path B skills live in a product repo and are registered here via `catalog/`.
+      description: See the two contribution paths in `CONTRIBUTING.md`. Path A skills are authored under `skills/` in this repo; Path B skills live in a product repo and are registered here via `scripts/sources.yml`.
       options:
         - "Path A: incubated in this repo (may move to a product repo and continue to be registered here)"
         - "Path B: authored in a product repo (HIP, ROCm, Ryzen AI, Lemonade, ...) and registered here"
 
@@ -0,0 +1,103 @@
+name: import-external-skills
+
+# Manually-dispatched workflow that refreshes the federated portion of the
+# catalog. It reads `scripts/sources.yml`, shallow-clones each declared
+# source, vendors the named skills into `skills/<name>/`, updates
+# `.claude-plugin/marketplace.json`, regenerates the Cursor manifest, and
+# opens a pull request with the result. Every imported skill goes through
+# the same `validate` checks as in-repo skills before it lands on `main`.
+#
+# See the "A federated catalog" section of `README.md` for the design.
+
+on:
+  workflow_dispatch:
+    inputs:
+      dry_run:
+        description: "Resolve sources and print planned changes without committing."
+        required: false
+        type: boolean
+        default: false
+
+permissions:
+  contents: write
+  pull-requests: write
+
+concurrency:
+  group: import-external-skills
+  cancel-in-progress: false
+
+jobs:
+  import:
+    name: Import external skills
+    runs-on: ubuntu-latest
+    steps:
+      - name: Check out repository
+        uses: actions/checkout@v4
+
+      - name: Set up uv
+        uses: astral-sh/setup-uv@v7
+
+      - name: Configure git for sparse-checkout
+        run: |
+          git --version
+          git config --global init.defaultBranch main
+
+      - name: Import skills declared in scripts/sources.yml
+        id: import
+        run: |
+          if [ "${{ inputs.dry_run }}" = "true" ]; then
+            uv run scripts/import_external_skills.py --dry-run
+          else
+            uv run scripts/import_external_skills.py
+          fi
+
+      - name: Regenerate Cursor plugin manifest
+        if: ${{ inputs.dry_run != true }}
+        run: uv run scripts/generate_cursor_plugin.py
+
+      - name: Validate skills and manifests
+        if: ${{ inputs.dry_run != true }}
+        run: ./scripts/check.sh
+
+      - name: Detect changes
+        if: ${{ inputs.dry_run != true }}
+        id: changes
+        run: |
+          if [ -z "$(git status --porcelain)" ]; then
+            echo "changed=false" >> "$GITHUB_OUTPUT"
+            echo "No changes to import. Skipping PR."
+          else
+            echo "changed=true" >> "$GITHUB_OUTPUT"
+            git status --short
+          fi
+
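+      # Use the third-party `peter-evans/create-pull-request` action to push
+      # to a dedicated branch and open a PR. PRs (rather than direct commits
+      # to main) keep imported changes reviewable and let the standard
+      # `validate` workflow gate them.
+      # NOTE(review): no `token` is passed below, so the PR is opened with
+      # the default GITHUB_TOKEN, and events created by that token do not
+      # trigger `pull_request` workflows. Confirm `validate` actually runs on
+      # these PRs (e.g. supply a PAT/GitHub App token, or close and reopen).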
+      - name: Open pull request with imported skills
+        if: ${{ inputs.dry_run != true && steps.changes.outputs.changed == 'true' }}
+        uses: peter-evans/create-pull-request@v7
+        with:
+          branch: bot/import-external-skills
+          delete-branch: true
+          commit-message: "chore(catalog): refresh federated skills from scripts/sources.yml"
+          title: "Refresh federated skills"
+          body: |
+            Automated import driven by `scripts/sources.yml`.
+
+            See the "A federated catalog" section of `README.md` for the
+            design. Each vendored skill includes a `.federated.json` marker
+            recording the source repo, pinned ref, and resolved commit at
+            import time.
+
+            Triggered by @${{ github.actor }} via the `import-external-skills`
+            workflow ([run](${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }})).
+          labels: |
+            catalog
+            automated
+          add-paths: |
+            scripts/sources.yml
+            skills/**
+            .claude-plugin/**
+            .cursor-plugin/**
@@ -33,8 +33,8 @@ Best for cross-cutting skills that do not have a natural product home.
 Best for skills that should ship and version with a product (HIP, MIGraphX, Ryzen AI, Lemonade, etc.).
 
 1. Add the skill folder to your product repository; a common location is `.agents/skills/<skill-name>/`.
-2. Open a pull request here that adds an entry to `catalog/` pointing at the skill's location and pinning a tag.
-3. CI will validate the linked skill against the same rules as in-repo skills, and the central plugin manifests will surface it through one install.
+2. Open a pull request here that adds (or extends) an entry in [`scripts/sources.yml`](scripts/sources.yml) — the master list — naming your repo, a pinned ref, the sub-path that holds skill folders, and your skill's folder name.
+3. Once that change merges, dispatch the `import-external-skills` workflow from the Actions tab. It shallow-clones your repo at the pinned ref, vendors the skill into `skills/<name>/`, updates `.claude-plugin/marketplace.json`, and opens a follow-up pull request. Validation then runs against the same rules as in-repo skills before merge.
 
 ## Is this task a good fit for a skill?
 
 
@@ -107,8 +107,8 @@ So skills here are **federated**: each skill is owned and versioned by the team
                 ┌─────────────────────────────────────────────────────┐
                 │                amd/skills (this repo)               │
                 │                                                     │
-                │   skills/         catalog/         .*-plugin/       │
-                │   in-repo skills  pointers         agent manifests  │
+                │   skills/         scripts/         .*-plugin/       │
+                │   in-repo skills  sources.yml      agent manifests  │
                 └──────────────────────┬──────────────────────────────┘
                                        │  one install
                                        ▼
@@ -124,7 +124,7 @@ So skills here are **federated**: each skill is owned and versioned by the team
 
 Each skill stays close to the engineers who ship the underlying product, the CI that validates it, and the release tag that pins it.
 
-This repo also acts as an **incubator**: a skill can start its life under `skills/` here to iterate quickly, then graduate to its product repo and be re-pointed from `catalog/` once it has a clear owner, with no change for installed users.
+This repo also acts as an **incubator**: a skill can start its life under `skills/` here to iterate quickly, then graduate to its product repo and be re-pointed from `scripts/sources.yml` once it has a clear owner, with no change for installed users.
 
 ### What this means for you
 
@@ -135,21 +135,29 @@ This repo also acts as an **incubator**: a skill can start its life under `skill
 ### What this means if you contribute
 
 - **In-repo skills** (Path A) are best for cross-cutting workflows that do not have a natural product home.
-- **Product-repo skills** (Path B) are best for skills that should live and version with a specific product. You add the skill folder to your product repo and open a small PR here that registers it in `catalog/` with a pinned tag. CI validates the linked skill against the same rules as in-repo skills, and the central plugin manifests surface it through the same one install.
+- **Product-repo skills** (Path B) are best for skills that should live and version with a specific product. You add the skill folder to your product repo and open a small PR here that registers it in `scripts/sources.yml` with a pinned tag. CI validates the vendored copy against the same rules as in-repo skills, and the central plugin manifests surface it through the same one install.
 
 See [CONTRIBUTING.md](CONTRIBUTING.md) for the step-by-step contribution flow for each path.
 
 ### Repository layout
 
 ```
-skills/             # Skills authored in this repository
-catalog/            # Manifest pointers to skills that live in product repositories
-.cursor-plugin/     # Cursor plugin manifest
-.claude-plugin/     # Claude Code marketplace manifest
-.github/workflows/  # CI for validating skills and manifests
-scripts/            # Tooling for publishing and regenerating manifests
+skills/                  # All skills the agent can load (in-repo + vendored copies of federated)
+.cursor-plugin/          # Cursor plugin manifest
+.claude-plugin/          # Claude Code marketplace manifest
+.github/workflows/       # CI for validating skills and the `import-external-skills` workflow
+scripts/                 # Tooling for publishing, regenerating manifests, and importing
+scripts/sources.yml      # Master list of external skill sources for federation
 ```
 
+In-repo skills are authored directly under `skills/`. Federated skills are
+declared in [`scripts/sources.yml`](scripts/sources.yml) and vendored into
+`skills/` by the manually-dispatched `import-external-skills` workflow,
+which opens a pull request with the imported copies. Each vendored skill
+carries a `.federated.json` marker that records the upstream repo and
+pinned commit, so the importer can refresh or remove it without disturbing
+in-repo skills.
+
 ## Manual Installation
 
 AMD Skills are compatible with Cursor, Claude Code, OpenAI Codex, and Gemini CLI. The general flow:
@@ -194,7 +202,7 @@ The agent loads the matching `SKILL.md` and any helper scripts, then carries out
 We welcome contributions from AMD engineers and selected partners. There are two paths, matching how the catalog is organized:
 
 - **Path A: In-repo skills.** Authored directly under `skills/` in this repository. Best for cross-cutting workflows that do not have a natural product home.
-- **Path B: Product-repo skills.** Authored in a product repository and registered here through `catalog/` with a pinned tag. Best for skills that should ship and version with a specific product (HIP, ROCm, Ryzen AI, Lemonade, etc.).
+- **Path B: Product-repo skills.** Authored in a product repository and registered here through `scripts/sources.yml` with a pinned tag. Best for skills that should ship and version with a specific product (HIP, ROCm, Ryzen AI, Lemonade, etc.).
 
 See [CONTRIBUTING.md](CONTRIBUTING.md) for step-by-step instructions, the full authoring guide, and the rules CI enforces on every pull request.