Merge pull request trustyai-explainability#141 from trustyai-explainability/rhoaieng-55152

saichandrapandraju · web-flow · commit 0079b6d03f7e · 2026-03-25T08:40:07.000-07:00
Rename 'stubs' to 'prompts' in report UI labels
diff --git a/src/llama_stack_provider_trustyai_garak/resources/art_report.jinja2 b/src/llama_stack_provider_trustyai_garak/resources/art_report.jinja2
@@ -157,10 +157,10 @@
                                             <th role="columnheader" scope="col">Intent</th>
                                             <th role="columnheader" scope="col">Total Attempts</th>
                                             {% if probe.is_baseline %}
-                                                <th role="columnheader" scope="col">Unsafe Stubs</th>
+                                                <th role="columnheader" scope="col">Unsafe Prompts</th>
                                                 <th role="columnheader" scope="col">Unsafe Rate</th>
                                             {% else %}
-                                                <th role="columnheader" scope="col">Unsafe Stubs</th>
+                                                <th role="columnheader" scope="col">Unsafe Prompts</th>
                                                 <th role="columnheader" scope="col">Attack Success Rate</th>
                                             {% endif %}
                                         </tr>
@@ -171,13 +171,13 @@
                                                 <td role="cell" data-label="Intent">{{ row.intent_name }}</td>
                                                 <td role="cell" data-label="Total Attempts">{{ row.total_attacks }}</td>
                                                 {% if probe.is_baseline %}
-                                                    <td role="cell" data-label="Unsafe Stubs">{{ row.complied_attacks }}
+                                                    <td role="cell" data-label="Unsafe Prompts">{{ row.complied_attacks }}
                                                         / {{ row.total_attacks }}</td>
                                                     <td role="cell"
                                                         data-label="Unsafe Rate">{{ row.asr }}%
                                                     </td>
                                                 {% else %}
-                                                    <td role="cell" data-label="Unsafe Stubs">{{ row.jailbroken_stubs }}
+                                                    <td role="cell" data-label="Unsafe Prompts">{{ row.jailbroken_stubs }}
                                                         / {{ row.baseline_stubs }}</td>
                                                     <td role="cell"
                                                         data-label="Attack Success Rate">{{ row.asr }}%
diff --git a/src/llama_stack_provider_trustyai_garak/resources/vega_chart_behaviour_by_intent.json b/src/llama_stack_provider_trustyai_garak/resources/vega_chart_behaviour_by_intent.json
@@ -91,7 +91,7 @@
       "aggregate": "max",
       "type": "quantitative",
       "legend": {
-        "title": "Baseline Stubs",
+        "title": "Baseline Prompts",
         "format": "d"
       }
     },
@@ -119,7 +119,7 @@
       },
       {
         "field": "stub",
-        "title": "Stub"
+        "title": "Prompt"
       },
       {
         "field": "probe_name",
@@ -132,7 +132,7 @@
       {
         "field": "baseline_stubs",
         "type": "quantitative",
-        "title": "Baseline Stubs"
+        "title": "Baseline Prompts"
       }
     ]
   },
diff --git a/src/llama_stack_provider_trustyai_garak/resources/vega_chart_behaviour_by_probe.json b/src/llama_stack_provider_trustyai_garak/resources/vega_chart_behaviour_by_probe.json
@@ -184,15 +184,15 @@
           {
             "field": "baseline_stubs",
             "type": "quantitative",
-            "title": "Baseline Stubs"
+            "title": "Baseline Prompts"
           },
           {
             "field": "intent_name",
             "title": "Intent"
           },
           {
             "field": "stub",
-            "title": "Stub"
+            "title": "Prompt"
           },
           {
             "field": "outcome",
diff --git a/src/llama_stack_provider_trustyai_garak/result_utils.py b/src/llama_stack_provider_trustyai_garak/result_utils.py
@@ -1069,8 +1069,8 @@ def high_level_stats(attacks_by_intent_data):
 
     return [
         {"label": "Total attempts", "value": total_attempts},
-        {"label": "Unsafe stubs", "value": unsafe_count},
-        {"label": "Safe stubs", "value": safe_count},
+        {"label": "Unsafe prompts", "value": unsafe_count},
+        {"label": "Safe prompts", "value": safe_count},
         {"label": "Attack success rate", "value": format(success_rate, ".0f") + "%"},
     ]
 
diff --git a/tests/test_utils.py b/tests/test_utils.py
@@ -741,8 +741,8 @@ def test_high_level_stats(self):
 
         stats = {s["label"]: s["value"] for s in result}
         assert stats["Total attempts"] == 5  # 1+1+1+2
-        assert stats["Unsafe stubs"] == 2  # stub_a + stub_d jailbroken across all probes
-        assert stats["Safe stubs"] == 2  # stub_b and stub_c never jailbroken
+        assert stats["Unsafe prompts"] == 2  # stub_a + stub_d jailbroken across all probes
+        assert stats["Safe prompts"] == 2  # stub_b and stub_c never jailbroken
         assert stats["Attack success rate"] == "50%"  # 2/4 unique stubs jailbroken
 
     def test_vega_data_includes_intent_name(self):
@@ -894,8 +894,8 @@ def test_intents_aggregates_match_high_level_stats(self):
         intents_metrics = calculate_intents_aggregates(all_raw)
 
         assert intents_metrics["total_attempts"] == art_dict["Total attempts"]
-        assert intents_metrics["unsafe_stubs"] == art_dict["Unsafe stubs"]
-        assert intents_metrics["safe_stubs"] == art_dict["Safe stubs"]
+        assert intents_metrics["unsafe_stubs"] == art_dict["Unsafe prompts"]
+        assert intents_metrics["safe_stubs"] == art_dict["Safe prompts"]
         expected_rate = art_dict["Attack success rate"].replace("%", "")
         assert format(intents_metrics["attack_success_rate"], ".0f") == expected_rate
 

Original file line number	Diff line number	Diff line change
`@@ -91,7 +91,7 @@`
`91`	`91`	`"aggregate": "max",`
`92`	`92`	`"type": "quantitative",`
`93`	`93`	`"legend": {`
`94`		`- "title": "Baseline Stubs",`
	`94`	`+ "title": "Baseline Prompts",`
`95`	`95`	`"format": "d"`
`96`	`96`	`}`
`97`	`97`	`},`
`@@ -119,7 +119,7 @@`
`119`	`119`	`},`
`120`	`120`	`{`
`121`	`121`	`"field": "stub",`
`122`		`- "title": "Stub"`
	`122`	`+ "title": "Prompt"`
`123`	`123`	`},`
`124`	`124`	`{`
`125`	`125`	`"field": "probe_name",`
`@@ -132,7 +132,7 @@`
`132`	`132`	`{`
`133`	`133`	`"field": "baseline_stubs",`
`134`	`134`	`"type": "quantitative",`
`135`		`- "title": "Baseline Stubs"`
	`135`	`+ "title": "Baseline Prompts"`
`136`	`136`	`}`
`137`	`137`	`]`
`138`	`138`	`},`
Original file line number	Diff line number	Diff line change
`@@ -184,15 +184,15 @@`
`184`	`184`	`{`
`185`	`185`	`"field": "baseline_stubs",`
`186`	`186`	`"type": "quantitative",`
`187`		`- "title": "Baseline Stubs"`
	`187`	`+ "title": "Baseline Prompts"`
`188`	`188`	`},`
`189`	`189`	`{`
`190`	`190`	`"field": "intent_name",`
`191`	`191`	`"title": "Intent"`
`192`	`192`	`},`
`193`	`193`	`{`
`194`	`194`	`"field": "stub",`
`195`		`- "title": "Stub"`
	`195`	`+ "title": "Prompt"`
`196`	`196`	`},`
`197`	`197`	`{`
`198`	`198`	`"field": "outcome",`
Original file line number	Diff line number	Diff line change
`@@ -1069,8 +1069,8 @@ def high_level_stats(attacks_by_intent_data):`
`1069`	`1069`
`1070`	`1070`	`return [`
`1071`	`1071`	`{"label": "Total attempts", "value": total_attempts},`
`1072`		`- {"label": "Unsafe stubs", "value": unsafe_count},`
`1073`		`- {"label": "Safe stubs", "value": safe_count},`
	`1072`	`+ {"label": "Unsafe prompts", "value": unsafe_count},`
	`1073`	`+ {"label": "Safe prompts", "value": safe_count},`
`1074`	`1074`	`{"label": "Attack success rate", "value": format(success_rate, ".0f") + "%"},`
`1075`	`1075`	`]`
`1076`	`1076`