feat: add critical child safety violation category and patterns; update README; bump version to v2.6.2

Oracles Technologies LLC · Oracles Technologies LLC · commit 339bbe17a29f · 2026-05-20T11:01:21.000-05:00
diff --git a/README.md b/README.md
@@ -204,18 +204,19 @@ Guardian protects your AI system from adversarial inputs designed to:
 - **Coordinate across modalities** — split-channel attacks that distribute threat signals across text and visual inputs, each appearing benign in isolation *(API)*
 - **Hide payloads in video** — injection content embedded across video frames, including temporally recurring signals designed to survive frame-level filtering *(API)*
 
-The community edition covers the six most prevalent categories. The API covers 100+.
+The community edition covers seven categories: six OWASP-aligned attack vectors plus an absolute-block child safety category. The API covers 126+.
 
 ---
 
 ## Community vs API
 
 | | Community | API — Free | API — Pro | API — ENT |
 |---|---|---|---|---|
-| **Threat categories** | 6 | 100+ | 100+ | 100+ |
-| **Regex patterns** | 26 | 1000+ | 1000+ | 1000+ |
+| **Threat categories** | 7 | 126+ | 126+ | 126+ |
+| **Regex patterns** | 34 | 1,000+ | 1,000+ | 1,000+ |
+| **Child safety (absolute block)** | ✅ | ✅ | ✅ | ✅ |
 | **Semantic model** | Hash-based fallback | Full ONNX MiniLM-L6-v2 | Full ONNX MiniLM-L6-v2 | Full ONNX MiniLM-L6-v2 |
-| **Semantic fingerprints** | Runtime-only | 1,000+ pre-loaded + runtime | 1,000+ pre-loaded + runtime | 1,000+ pre-loaded + runtime |
+| **Semantic fingerprints** | Runtime-only | 1,959 pre-loaded + runtime | 1,959 pre-loaded + runtime | 1,959 pre-loaded + runtime |
 | **RAG / indirect injection** | — | ✅ | ✅ | ✅ |
 | **Agentic pipeline protection** | — | ✅ | ✅ | ✅ |
 | **Tool call validation** | — | ✅ | ✅ | ✅ |
diff --git a/ethicore_guardian/__init__.py b/ethicore_guardian/__init__.py
@@ -7,7 +7,7 @@
 """
 
 # Version information
-__version__ = "2.6.1"
+__version__ = "2.6.2"
 __author__ = "Oracles Technologies LLC"
 
 # Core exports — full API-tier guardian preferred; community fallback for wheel installs
diff --git a/ethicore_guardian/data/threat_patterns.py b/ethicore_guardian/data/threat_patterns.py
@@ -4,8 +4,9 @@
 
 Version: 1.0.0 (Community)
 
-This is the open-source community edition, covering 5 OWASP LLM Top-10
-aligned threat categories.  The API tier adds 50+ additional categories,
+This is the open-source community edition, covering 6 OWASP LLM Top-10
+aligned threat categories plus an absolute-block child safety category.
+The API tier adds 100+ additional categories,
 complete ONNX semantic embeddings, and advanced agentic/multi-turn threat
 detection.
 
@@ -51,7 +52,7 @@ class FalsePositiveRisk(Enum):
 
 
 # ---------------------------------------------------------------------------
-# Community threat pattern registry — 5 categories
+# Community threat pattern registry — 7 categories
 #
 # Patterns sourced from publicly documented research:
 #   OWASP LLM01 (Prompt Injection), LLM02 (Insecure Output Handling),
@@ -225,6 +226,73 @@ class FalsePositiveRisk(Enum):
         ),
     },
 
+    # ------------------------------------------------------------------
+    # childSafetyViolation — ABSOLUTE BLOCK (v2.6.2)
+    # Guiding Principle 15: Sacred Protection of the Innocent (Mishmar HaYeledim)
+    # Matthew 18:6 — "It would be better for them to have a large millstone
+    # hung around their neck and to be drowned in the depths of the sea."
+    #
+    # Absolute prohibition: CSAM/CSEM under ANY framing (fictional, artistic,
+    # educational, aged-up characters), grooming communication strategies,
+    # child exploitation facilitation, child luring scripts, and content
+    # that sexualizes or exploits minors. No mitigating context. No exceptions.
+    # Weight 100 — maximum. False positives vastly preferable to false negatives.
+    # ------------------------------------------------------------------
+    "childSafetyViolation": {
+        "patterns": [
+            # Sexual content involving minors under ANY framing
+            r"(?:sexual|explicit|erotic|nude|intimate)\s+(?:content|scene|story|description|image|fiction)\s+(?:involving|featuring|with|about)\s+(?:an?\s+)?(?:minor|child|teen(?:ager)?|underage|young\s+(?:person|girl|boy)|kid|juvenile)",
+            # Grooming strategies — building inappropriate trust with a child
+            r"(?:groom|grooming)\s+(?:an?\s+)?(?:child|minor|kid|teen(?:ager)?|underage)\s+(?:by|through|using|via)\s+(?:building|establishing|gaining)\s+(?:trust|rapport|a\s+relationship|access)",
+            # Requests for scripts/messages to send to a child for grooming
+            r"(?:write|generate|give\s+me|create|draft)\s+(?:a\s+)?(?:message|script|text|conversation)\s+(?:to\s+(?:send\s+to|use\s+with|approach))\s+(?:a\s+)?(?:child|minor|kid|teen(?:ager)?|young\s+(?:person|girl|boy))\s+(?:to\s+(?:build|gain)\s+(?:trust|rapport))",
+            # Instructions for gaining unsupervised access to children; the "-ing" suffix is optional as a group so bare "bypass"/"evade" also match
+            r"(?:gain|get)\s+(?:(?:physical|digital|online|unsupervised|private)\s+)?access\s+to\s+(?:a\s+)?(?:child|minor|kid|children|minors)\s+(?:(?:without|bypass(?:ing)?|evad(?:e|ing))\s+(?:parental|guardian|adult|supervisory)\s+(?:oversight|supervision|monitoring|control))",
+            # CSAM/CSEM under any label: written, fictional, illustrated, simulated
+            r"(?:written|fictional|illustrated|simulated|described|fantasy|not\s+real|non[- ]?existent)\s+(?:CSAM|CSEM|child\s+(?:sexual\s+abuse\s+material|pornography|porn)|child\s+(?:exploitation|sexual\s+content))",
+            # Requesting manipulation strategies to convince a child to keep secrets
+            r"(?:convince|persuade|get|teach)\s+(?:a\s+)?(?:child|minor|kid|teen(?:ager)?)\s+to\s+keep\s+(?:(?:a\s+)?secret|(?:this|our)\s+(?:secret|between\s+us)|quiet)\s+from\s+(?:(?:their\s+)?(?:parents?|guardians?|adults?|family)|anyone)",
+            # Child luring via false affection, gifts, promises
+            r"(?:use|offer|give|promise)\s+(?:gifts?|presents?|money|candy|compliments?|affection|friendship)\s+to\s+(?:lure|attract|manipulate|gain\s+the\s+trust\s+of)\s+(?:a\s+)?(?:child|minor|kid|teen(?:ager)?)",
+            # Content normalizing adult-child sexual relationships under any framing
+            r"(?:normalize|portray|depict|describe|present)\s+(?:adult[- ]child|child[- ]adult)\s+(?:sexual|romantic|intimate)\s+(?:relationship|interaction|dynamic)\s+(?:as\s+)?(?:normal|acceptable|natural|cultural|historical|fictional)",
+        ],
+        "severity": ThreatSeverity.CRITICAL,
+        "weight": 100,
+        "description": (
+            "ABSOLUTE BLOCK — child safety violation. Covers CSAM/CSEM generation under "
+            "any framing, grooming communication strategies, child exploitation facilitation, "
+            "child luring scripts, and content sexualizing or exploiting minors. "
+            "No mitigating context. No creative/fictional/educational exceptions. "
+            "Matthew 18:6. False positives vastly preferable to false negatives."
+        ),
+        "semanticFingerprint": [
+            "CSAM generation request disguised as fictional creative writing involving minor characters",
+            "grooming communication strategy to build inappropriate trust with child victim",
+            "sexual content involving minor characters despite fictional or aged-up framing",
+            "child luring script using false affection and gift promises to manipulate minor",
+            "instruction to isolate child from protective adults as grooming preparation",
+            "secret-keeping manipulation strategy to prevent child from disclosing abuse",
+            "content normalizing adult-child relationship despite fictional cultural framing",
+            "strategy to circumvent parental oversight to gain unsupervised access to children",
+        ],
+        "contextHints": {
+            "escalators": [
+                "child", "minor", "underage", "young", "teenager", "kid",
+                "fictional", "not real", "aged up", "just characters", "18 in the story",
+                "grooming", "secret", "trust", "alone with",
+            ],
+            "mitigators": [],  # No mitigating context is accepted for this category
+        },
+        "falsePositiveRisk": FalsePositiveRisk.LOW,
+        "mitigationStrategy": (
+            "ABSOLUTE BLOCK — no mitigating context reduces this verdict. "
+            "Fictional or artistic framing, aged-up character claims, historical/cultural "
+            "context, and educational justifications are all explicitly rejected. "
+            "Escalate immediately to human review with maximum severity flag."
+        ),
+    },
+
     # ------------------------------------------------------------------
     # systemPromptLeaks — OWASP LLM07 (System Prompt Leakage)
     # Attempts to extract the model's system prompt or initial instructions.
diff --git a/ethicore_guardian/versions.py b/ethicore_guardian/versions.py
@@ -2,12 +2,12 @@
 Ethicore Engine™ - Guardian SDK - Version Information
 """
 
-__version__ = "2.6.1"
+__version__ = "2.6.2"
 __version_info__ = tuple(map(int, __version__.split('.')))
 
 # Build information
-__build__ = "stable.2"
-__release_date__ = "2026-05-18"
+__build__ = "stable.1"
+__release_date__ = "2026-05-20"
 
 # Feature flags
 FEATURES = {
@@ -19,12 +19,13 @@
     "framework_integrations": True,
     "supply_chain_integrity": True,   # v2.6.0: guardian verify + init self-check
     "local_provider_support": True,   # v2.6.1: LM Studio, llama.cpp, LocalAI, Jan.ai providers
+    "child_safety_protection": True,  # v2.6.2: childSafetyViolation absolute-block (Matthew 18:6)
 }
 
 # Model versions
 MODEL_VERSIONS = {
     "orchestrator": "3.0.0",
-    "pattern_analyzer": "1.2.0",   # 94 categories; +rlhfLayerExploitation, supplyChainDependencyInjection
+    "pattern_analyzer": "1.3.0",   # 7 community categories; +childSafetyViolation (CRITICAL, weight 100)
     "semantic_analyzer": "1.1.0",
     "behavioral_analyzer": "1.0.0",
     "ml_inference_engine": "3.2.0", # retrained 125k samples, 94 categories, 1230 fingerprints, 2026-05-18