awslabs
diff --git a/README.md b/README.md
Lines changed: 298 additions & 62 deletions
diff --git a/bin/cli.js b/bin/cli.js
Lines changed: 4 additions & 3 deletions
diff --git a/config/parameter-schema.json b/config/parameter-schema.json
Lines changed: 1 addition & 1 deletion
diff --git a/package-lock.json b/package-lock.json
Lines changed: 2 additions & 2 deletions
diff --git a/package.json b/package.json
Lines changed: 1 addition & 1 deletion
diff --git a/src/app.js b/src/app.js
Lines changed: 17 additions & 1 deletion
diff --git a/src/lib/auto-prompt-builder.js b/src/lib/auto-prompt-builder.js
Lines changed: 172 additions & 0 deletions
diff --git a/src/lib/ci-register-helpers.js b/src/lib/ci-register-helpers.js
Lines changed: 1 addition & 1 deletion
diff --git a/src/lib/cli-handler.js b/src/lib/cli-handler.js
Lines changed: 1 addition & 1 deletion
@@ -27,7 +27,8 @@ program
 
     // --- General ---
     .addOption(new Option('--skip-prompts', 'Skip interactive prompts and use configuration from other sources'))
-    .addOption(new Option('--config <path>', 'Path to configuration file'))
+    .addOption(new Option('--auto-prompt', 'Fill defaults, prompt only for missing required values'))
+    .addOption(new Option('--config <path>', 'Path to JSON configuration file'))
     .addOption(new Option('--project-name <name>', 'Project name'))
     .addOption(new Option('--project-dir <dir>', 'Output directory path'))
     .addOption(new Option('--force', 'Overwrite existing output directory without prompting'))
@@ -41,7 +42,7 @@ program
     .addOption(new Option('--base-image <image>', 'Base container image for Dockerfile'))
 
     // --- Build & Infrastructure ---
-    .addOption(new Option('--deployment-target <target>', 'Deployment target (managed-inference, async-inference, batch-transform, hyperpod-eks)'))
+    .addOption(new Option('--deployment-target <target>', 'Deployment target (realtime-inference, async-inference, batch-transform, hyperpod-eks)'))
     .addOption(new Option('--instance-type <type>', 'SageMaker instance type (e.g. ml.g5.xlarge, ml.m5.large)'))
     .addOption(new Option('--region <region>', 'AWS region'))
     .addOption(new Option('--role-arn <arn>', 'IAM role ARN for SageMaker execution'))
@@ -154,7 +155,7 @@ program.configureHelp({
 
         for (const opt of allOptions) {
             const long = opt.long || '';
-            if (['--skip-prompts', '--config', '--project-name', '--project-dir', '--force', '--version', '--help'].includes(long)) {
+            if (['--skip-prompts', '--auto-prompt', '--config', '--project-name', '--project-dir', '--force', '--version', '--help'].includes(long)) {
                 groups.general.push(opt);
             } else if (['--deployment-config', '--framework', '--model-format', '--model-name', '--model-server', '--base-image'].includes(long)) {
                 groups.model.push(opt);
 
@@ -1,7 +1,7 @@
 {
     "schemaVersion": "1.0.0",
     "deploymentTargets": {
-        "managed-inference": {
+        "realtime-inference": {
             "endpoint": {
                 "initialInstanceCount": {
                     "type": "integer",
 
@@ -1,6 +1,6 @@
 {
   "name": "@aws/ml-container-creator",
-  "version": "0.2.3",
+  "version": "0.2.4",
   "description": "Generator for SageMaker AI BYOC paradigm for predictive inference use-cases.",
   "type": "module",
   "main": "src/app.js",
 
@@ -156,6 +156,22 @@ export async function run(projectName, options) {
             console.log('   If your model package lacks an InferenceSpecification, use the S3 path');
             console.log('   directly instead: --model-name="s3://bucket/path/model.tar.gz"\n');
         }
+    } else if (configManager.isAutoPrompt()) {
+        // Auto-prompt mode: run the wizard with all resolved values pre-filled.
+        // The wizard skips prompts for values already in explicitConfig and
+        // uses phase-level gates to skip irrelevant sections entirely.
+        // This gives context-aware prompting (correct MCP queries, filtered choices)
+        // while only asking for what's truly missing.
+        console.log('\n🔄 Auto-prompt mode — prompting only for missing values with full context');
+
+        const promptRunner = new PromptRunner({
+            configManager,
+            options: kebabOptions,
+            registryConfigManager,
+            baseConfig
+        });
+        const promptAnswers = await promptRunner.run();
+        answers = configManager.getFinalConfiguration(promptAnswers);
     } else {
         const promptRunner = new PromptRunner({
             configManager,
@@ -482,7 +498,7 @@ async function _ensureTemplateVariables(answers, registryConfigManager = null) {
         testTypes: [],
         buildTimestamp: new Date().toISOString(),
         buildTarget: 'codebuild',
-        deploymentTarget: 'managed-inference',
+        deploymentTarget: 'realtime-inference',
         hyperPodCluster: null,
         hyperPodNamespace: 'default',
         hyperPodReplicas: 1,
 
@@ -0,0 +1,172 @@
+// Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
+// SPDX-License-Identifier: Apache-2.0
+
+/**
+ * Auto-Prompt Builder — generates targeted prompts for missing required parameters.
+ * 
+ * Used by --auto-prompt mode to ask only for values that cannot be inferred
+ * or defaulted from the provided CLI flags.
+ */
+
+/**
+ * Builds a minimal set of prompts for the given missing parameters.
+ * Each prompt is self-contained and doesn't depend on multi-phase wizard state.
+ *
+ * @param {string[]} missingParams - Parameter names that need values
+ * @param {object} currentConfig - Current configuration (with defaults filled)
+ * @returns {Array} Array of prompt objects compatible with runPrompts()
+ */
+export function buildAutoPrompts(missingParams, currentConfig) {
+    const prompts = [];
+
+    for (const param of missingParams) {
+        const builder = PROMPT_BUILDERS[param];
+        if (builder) {
+            const prompt = builder(currentConfig);
+            if (prompt) {
+                prompts.push(prompt);
+            }
+        } else {
+            // Fallback: generic text input for unknown parameters
+            prompts.push({
+                type: 'input',
+                name: param,
+                message: `Enter value for ${param}:`
+            });
+        }
+    }
+
+    return prompts;
+}
+
+/**
+ * Map of parameter names to prompt builder functions.
+ * Each builder receives the current config and returns a prompt object.
+ *
+ * Every builder here returns a `type: 'list'` prompt whose `name` equals its
+ * own key in this map:
+ *
+ * - deploymentConfig: fixed list of deployment configurations, grouped by
+ *   separator entries; ignores the config argument.
+ * - instanceType: reads `config.architecture` and offers the GPU list when it
+ *   is 'transformers', 'triton' or 'diffusors', otherwise the CPU list.
+ * - deploymentTarget: fixed list of four targets; ignores the config argument.
+ * - modelFormat: reads `config.engine` and offers the formats listed for that
+ *   engine in its local formatMap.
+ * - awsRegion: fixed list of regions; ignores the config argument.
+ * - buildTarget: a single 'codebuild' choice; ignores the config argument.
+ *
+ * The instanceType and awsRegion lists end with a 'Custom (enter manually)'
+ * choice whose value is the sentinel '_custom'.
+ * NOTE(review): nothing in this map builds a follow-up free-text prompt for
+ * '_custom'; presumably the caller resolves it. Confirm before relying on it.
+ *
+ * instanceType and modelFormat dereference `config` directly, so they throw a
+ * TypeError if called with null/undefined.
+ */
+const PROMPT_BUILDERS = {
+    deploymentConfig: (_config) => ({
+        type: 'list',
+        name: 'deploymentConfig',
+        message: 'Select deployment configuration:',
+        choices: [
+            { type: 'separator', separator: '── Large Language Models ──' },
+            { name: 'Transformers with vLLM', value: 'transformers-vllm' },
+            { name: 'Transformers with SGLang', value: 'transformers-sglang' },
+            { name: 'Transformers with TensorRT-LLM', value: 'transformers-tensorrt-llm' },
+            { name: 'Transformers with LMI', value: 'transformers-lmi' },
+            { name: 'Transformers with DJL', value: 'transformers-djl' },
+            { type: 'separator', separator: '── HTTP Serving ──' },
+            { name: 'HTTP with Flask', value: 'http-flask' },
+            { name: 'HTTP with FastAPI', value: 'http-fastapi' },
+            { type: 'separator', separator: '── NVIDIA Triton ──' },
+            { name: 'Triton FIL (XGBoost, LightGBM)', value: 'triton-fil' },
+            { name: 'Triton ONNX Runtime', value: 'triton-onnxruntime' },
+            { name: 'Triton TensorFlow', value: 'triton-tensorflow' },
+            { name: 'Triton PyTorch', value: 'triton-pytorch' },
+            { name: 'Triton vLLM', value: 'triton-vllm' },
+            { name: 'Triton TensorRT-LLM', value: 'triton-tensorrtllm' },
+            { name: 'Triton Python Backend', value: 'triton-python' },
+            { type: 'separator', separator: '── Diffusion Models ──' },
+            { name: 'Diffusors with vLLM Omni', value: 'diffusors-vllm-omni' }
+        ]
+    }),
+
+    instanceType: (config) => {
+        const architecture = config.architecture || 'http'; // missing/falsy architecture is treated as 'http', which selects the CPU list
+        const isGpu = architecture === 'transformers' || architecture === 'triton' || architecture === 'diffusors';
+
+        const gpuChoices = [
+            { name: 'ml.g5.xlarge  (1× A10G 24GB — small LLMs)', value: 'ml.g5.xlarge' },
+            { name: 'ml.g5.2xlarge (1× A10G 24GB — medium LLMs)', value: 'ml.g5.2xlarge' },
+            { name: 'ml.g5.4xlarge (1× A10G 24GB — larger models)', value: 'ml.g5.4xlarge' },
+            { name: 'ml.g5.12xlarge (4× A10G 96GB — large LLMs)', value: 'ml.g5.12xlarge' },
+            { name: 'ml.g5.48xlarge (8× A10G 192GB — very large)', value: 'ml.g5.48xlarge' },
+            { name: 'ml.g6.xlarge  (1× L4 24GB)', value: 'ml.g6.xlarge' },
+            { name: 'ml.g6.2xlarge (1× L4 24GB)', value: 'ml.g6.2xlarge' },
+            { name: 'ml.p4d.24xlarge (8× A100 320GB)', value: 'ml.p4d.24xlarge' },
+            { name: 'ml.p5.48xlarge (8× H100 640GB)', value: 'ml.p5.48xlarge' },
+            { name: 'Custom (enter manually)', value: '_custom' } // sentinel value, not a real instance type
+        ];
+
+        const cpuChoices = [
+            { name: 'ml.m5.large   (2 vCPU, 8GB — lightweight)', value: 'ml.m5.large' },
+            { name: 'ml.m5.xlarge  (4 vCPU, 16GB — small models)', value: 'ml.m5.xlarge' },
+            { name: 'ml.m5.2xlarge (8 vCPU, 32GB — medium models)', value: 'ml.m5.2xlarge' },
+            { name: 'ml.m5.4xlarge (16 vCPU, 64GB — large models)', value: 'ml.m5.4xlarge' },
+            { name: 'ml.c5.xlarge  (4 vCPU, 8GB — compute-heavy)', value: 'ml.c5.xlarge' },
+            { name: 'ml.c5.2xlarge (8 vCPU, 16GB — compute-heavy)', value: 'ml.c5.2xlarge' },
+            { name: 'Custom (enter manually)', value: '_custom' } // sentinel value, not a real instance type
+        ];
+
+        return {
+            type: 'list',
+            name: 'instanceType',
+            message: `Select instance type${isGpu ? ' (GPU recommended for this architecture)' : ''}:`,
+            choices: isGpu ? gpuChoices : cpuChoices
+        };
+    },
+
+    deploymentTarget: (_config) => ({
+        type: 'list',
+        name: 'deploymentTarget',
+        message: 'Select deployment target:',
+        choices: [
+            { name: 'Real-Time Inference', value: 'realtime-inference' },
+            { name: 'Async Inference', value: 'async-inference' },
+            { name: 'Batch Transform', value: 'batch-transform' },
+            { name: 'HyperPod EKS', value: 'hyperpod-eks' }
+        ]
+    }),
+
+    modelFormat: (config) => {
+        const engine = config.engine || 'sklearn'; // missing/falsy engine is treated as 'sklearn'
+        const formatMap = {
+            sklearn: [
+                { name: 'pkl (pickle)', value: 'pkl' },
+                { name: 'joblib', value: 'joblib' }
+            ],
+            xgboost: [
+                { name: 'json', value: 'json' },
+                { name: 'model (binary)', value: 'model' },
+                { name: 'ubj (universal binary JSON)', value: 'ubj' }
+            ],
+            tensorflow: [
+                { name: 'keras', value: 'keras' },
+                { name: 'h5', value: 'h5' },
+                { name: 'SavedModel', value: 'SavedModel' }
+            ]
+        };
+
+        const choices = formatMap[engine] || formatMap.sklearn; // engines not in formatMap reuse the sklearn list; NOTE(review): a plain lookup also matches inherited keys such as 'constructor'
+
+        return {
+            type: 'list',
+            name: 'modelFormat',
+            message: `Select model format for ${engine}:`, // shows the engine name as given, even when the sklearn fallback list is used
+            choices
+        };
+    },
+
+    awsRegion: (_config) => ({
+        type: 'list',
+        name: 'awsRegion',
+        message: 'Select AWS region:',
+        choices: [
+            { name: 'us-east-1 (N. Virginia)', value: 'us-east-1' },
+            { name: 'us-west-2 (Oregon)', value: 'us-west-2' },
+            { name: 'eu-west-1 (Ireland)', value: 'eu-west-1' },
+            { name: 'ap-northeast-1 (Tokyo)', value: 'ap-northeast-1' },
+            { name: 'ap-southeast-1 (Singapore)', value: 'ap-southeast-1' },
+            { name: 'Custom (enter manually)', value: '_custom' } // sentinel value, not a real region
+        ]
+    }),
+
+    buildTarget: (_config) => ({
+        type: 'list',
+        name: 'buildTarget',
+        message: 'Select build target:',
+        choices: [
+            { name: 'CodeBuild (recommended)', value: 'codebuild' } // only option offered by this prompt
+        ]
+    })
+};
@@ -25,7 +25,7 @@ import { createHash } from 'node:crypto';
  * @param {string} modelName - e.g. "meta-llama/Llama-2-7b-chat-hf", defaults to "none"
  * @param {string} instanceType - e.g. "ml.g5.xlarge"
  * @param {string} region - e.g. "us-east-1"
- * @param {string} deploymentTarget - e.g. "managed-inference"
+ * @param {string} deploymentTarget - e.g. "realtime-inference"
  * @returns {string} 16-character lowercase hex string
  */
 export function computeConfigId(deploymentConfig, modelName, instanceType, region, deploymentTarget) {
 
@@ -190,7 +190,7 @@ CLI OPTIONS:
   --instance-type=<type>      SageMaker instance type (e.g., ml.m5.large, ml.g5.xlarge)
   --region=<region>           AWS region
   --role-arn=<arn>            AWS IAM role ARN for SageMaker execution
-  --deployment-target=<target> Deployment target (managed-inference|hyperpod-eks)
+  --deployment-target=<target> Deployment target (realtime-inference|async-inference|batch-transform|hyperpod-eks)
   --hyperpod-cluster=<name> HyperPod EKS cluster name
   --hyperpod-namespace=<ns> Kubernetes namespace for HyperPod (default: default)
   --hyperpod-replicas=<n>   Number of replicas for HyperPod (default: 1)
Original file line number	Diff line number	Diff line change
`@@ -1,7 +1,7 @@`
`1`	`1`	`{`
`2`	`2`	`"schemaVersion": "1.0.0",`
`3`	`3`	`"deploymentTargets": {`
`4`		`- "managed-inference": {`
	`4`	`+ "realtime-inference": {`
`5`	`5`	`"endpoint": {`
`6`	`6`	`"initialInstanceCount": {`
`7`	`7`	`"type": "integer",`
Original file line number	Diff line number	Diff line change
`@@ -1,6 +1,6 @@`
`1`	`1`	`{`
`2`	`2`	`"name": "@aws/ml-container-creator",`
`3`		`- "version": "0.2.3",`
	`3`	`+ "version": "0.2.4",`
`4`	`4`	`"description": "Generator for SageMaker AI BYOC paradigm for predictive inference use-cases.",`
`5`	`5`	`"type": "module",`
`6`	`6`	`"main": "src/app.js",`