SocioProphet · mdheller · May 5, 2026 · May 7, 2026 · May 7, 2026 · May 7, 2026
diff --git a/ai-infra/AGENT_HARNESS_RISK_CONTROLS.md b/ai-infra/AGENT_HARNESS_RISK_CONTROLS.md
@@ -0,0 +1,242 @@
+# Agent Harness Risk Controls
+
+Status: v0.1 planning baseline  
+Owner plane: SCOPE-D defensive validation  
+Consumers: Delivery Excellence, Policy Fabric, AgentPlane, Memory Mesh, SourceOS, BearBrowser, TurtleTerm, SocioSphere
+
+## Purpose
+
+The Aden/Hive production-agent pattern introduces reusable skills, MCP servers, browser automation, terminal actions, memory writeback, generated graphs, judge loops, and evolution patches. SCOPE-D owns the defensive validation lane for those capability surfaces.
+
+This document defines the risk-control surface that turns agent harness risk into measurable delivery/security evidence.
+
+## Boundary
+
+SCOPE-D owns:
+
+- safe synthetic validation exercises
+- AI infrastructure risk assessment
+- MCP/tool server risk assessment
+- agent skill risk assessment
+- memory poisoning and recall/writeback abuse checks
+- browser automation abuse checks
+- terminal command risk checks
+- graph robustness checks
+- detection/control packaging
+- verified run summaries for handoff
+
+SCOPE-D does not own:
+
+- runtime execution authority; AgentPlane owns it
+- policy admission authority; Policy Fabric owns it
+- Delivery Excellence scoreboards and KPI definitions
+- Memory Mesh runtime implementation
+- BearBrowser or TurtleTerm product behavior
+- SocioSphere topology authority
+
+## Risk-control lanes
+
+### SkillRiskAssessment
+
+Targets portable `SKILL.md` and governed SourceOS skill envelopes.
+
+Checks:
+
+- prompt-injection content
+- hidden tool instructions
+- unsafe script execution
+- filesystem overreach
+- network overreach
+- credential access requests
+- missing evals
+- missing threat model
+- missing license/provenance
+- unpinned dependencies
+- trust-tier mismatch
+
+### MCPServerRiskAssessment
+
+Targets MCP servers and tool namespaces.
+
+Checks:
+
+- tool schema drift
+- namespace collision
+- unpinned server version
+- unsafe transport
+- unauthenticated local endpoint
+- credential scope overreach
+- filesystem/network overreach
+- missing health check
+- prompt/tool poisoning surface
+- revocation behavior
+
+### BrowserAutomationRiskAssessment
+
+Targets BearBrowser/browser-use workflows.
+
+Checks:
+
+- credential exfiltration
+- CSRF/local-origin abuse
+- unauthorized form submit
+- stealth/evasion misuse
+- malicious download bypass
+- upload leakage
+- external message-send risk
+- account-setting mutation
+- page-content prompt injection
+- domain allowlist bypass
+
+### TerminalActionRiskAssessment
+
+Targets TurtleTerm, agent-term, shell receipts, and workstation contracts.
+
+Checks:
+
+- command injection
+- shell escape
+- destructive command bypass
+- privilege escalation
+- unauthorized filesystem mutation
+- secret exfiltration
+- package install risk
+- unauthorized service exposure
+- host/cluster mutation bypass
+- generated script risk
+
+### MemoryRiskAssessment
+
+Targets Memory Mesh and context-pack flows.
+
+Checks:
+
+- memory poisoning
+- cross-tenant recall bleed
+- sensitive-payload storage bypass
+- retrieval prompt injection
+- writeback abuse
+- redaction bypass
+- artifact pointer spoofing
+- vector-store drift
+- contradiction/drift propagation
+
+### GraphRobustnessAssessment
+
+Targets AgentPlane graphs, policy graphs, memory graphs, trust graphs, and evidence graphs.
+
+Checks:
+
+- unbounded loops
+- missing failure edges
+- unsafe retry paths
+- hidden side-effect nodes
+- judge confidence bypass
+- promotion gate bypass
+- graph injection
+- policy-edge inconsistency
+- dependency-cycle risk
+- missing rollback path
+
+### EvolutionPatchRiskAssessment
+
+Targets proposed graph/prompt/tool/skill/policy/code changes.
+
+Checks:
+
+- self-promotion attempt
+- hidden authority expansion
+- policy weakening
+- test removal
+- evidence removal
+- rollback removal
+- prompt injection in patch text
+- risky dependency introduction
+- supply-chain degradation
+
+## Evidence outputs
+
+Every SCOPE-D agent-harness risk run should emit:
+
+- risk assessment manifest
+- safe synthetic event stream
+- finding records
+- recommended controls
+- policy gate refs
+- affected asset refs
+- run receipt
+- verified run summary
+- Delivery Excellence projection fields
+
+## Delivery Excellence projection
+
+SCOPE-D should export or support projection into these Delivery Excellence metrics:
+
+- skill risk score
+- MCP server risk score
+- browser automation risk score
+- terminal action risk score
+- memory risk score
+- graph robustness score
+- open high-risk findings
+- blocked promotion count
+- verified-run count
+- control coverage count
+- defect/regression count
+
+Delivery Excellence consumes risk scores and verified summaries, not unsafe exploit payloads.
+
+## Policy Fabric integration
+
+Policy Fabric should consume SCOPE-D findings as inputs to:
+
+- SkillGrantGate
+- MCPGrantGate
+- BrowserActionGate
+- TerminalActionGate
+- MemoryGate
+- GraphAdmissionGate
+- PromotionGate
+
+High-risk or unverified assets should default to blocked, quarantined, or human-review-required posture.
+
+## AgentPlane integration
+
+AgentPlane should cite SCOPE-D risk results in:
+
+- EvidencePack
+- PromotionGate
+- FailureDiagnosis
+- EvolutionPatch review
+- graph/template/skill promotion records
+
+## Memory Mesh integration
+
+Memory-related findings should reference Memory Mesh artifact pointers and context-pack refs instead of raw sensitive payloads.
+
+## SourceOS integration
+
+SourceOS execution receipt classes should be SCOPE-D assessment targets:
+
+- LocalAgentRuntimeReceipt
+- ShellReceiptEvent
+- BrowserActionReceipt
+- ModelCarryRouteReceipt
+- HostMutationBoundaryReceipt
+- DownloadArtifactReceipt
+
+## Non-negotiables
+
+- SCOPE-D defaults to read-only, synthetic, and dry-run validation.
+- No deployable malware, C2 payloads, credential theft workflows, destructive automation, or unauthorized execution logic belongs in this repo.
+- Risk findings must preserve provenance and safe evidence.
+- Risk scores must be traceable to verified run summaries.
+- Delivery Excellence receives risk metrics and customer-safe summaries, not unsafe payloads.
+
+## Near-term implementation path
+
+1. Add schemas/examples for the assessment lanes above.
+2. Add safe synthetic fixtures for skill, MCP, browser, terminal, memory, graph, and evolution-patch risk.
+3. Extend verified run reporting with agent-harness risk fields.
+4. Add Delivery Excellence metric projection examples.
+5. Wire Policy Fabric gate docs to consume SCOPE-D risk results.
diff --git a/config/schemas/agent-harness-risk-assessment.schema.json b/config/schemas/agent-harness-risk-assessment.schema.json
@@ -0,0 +1,82 @@
+{
+  "$schema": "https://json-schema.org/draft/2020-12/schema",
+  "$id": "https://socioprophet.org/schemas/scope-d/agent-harness-risk-assessment.schema.json",
+  "title": "AgentHarnessRiskAssessment",
+  "type": "object",
+  "additionalProperties": false,
+  "required": [
+    "schemaVersion",
+    "assessmentId",
+    "assessmentMode",
+    "target",
+    "riskLanes",
+    "findings",
+    "safetyBoundary",
+    "deliveryProjection"
+  ],
+  "properties": {
+    "schemaVersion": { "const": "v0.1" },
+    "assessmentId": { "type": "string" },
+    "assessmentMode": { "type": "string", "enum": ["read_only", "synthetic_only", "dry_run"] },
+    "target": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["assetRef", "assetType", "ownerRepo"],
+      "properties": {
+        "assetRef": { "type": "string" },
+        "assetType": { "type": "string", "enum": ["skill", "mcp-server", "browser-workflow", "terminal-workflow", "memory-flow", "agent-graph", "evolution-patch"] },
+        "ownerRepo": { "type": "string" }
+      }
+    },
+    "riskLanes": {
+      "type": "array",
+      "items": {
+        "type": "string",
+        "enum": ["skill", "mcp", "browser", "terminal", "memory", "graph", "evolution-patch"]
+      }
+    },
+    "findings": {
+      "type": "array",
+      "items": {
+        "type": "object",
+        "additionalProperties": false,
+        "required": ["findingId", "lane", "severity", "title", "evidenceRef", "recommendedControl"],
+        "properties": {
+          "findingId": { "type": "string" },
+          "lane": { "type": "string", "enum": ["skill", "mcp", "browser", "terminal", "memory", "graph", "evolution-patch"] },
+          "severity": { "type": "string", "enum": ["info", "low", "medium", "high", "critical"] },
+          "title": { "type": "string" },
+          "evidenceRef": { "type": "string" },
+          "recommendedControl": { "type": "string" }
+        }
+      }
+    },
+    "safetyBoundary": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["liveActionsExecuted", "syntheticOnly", "credentialCollectionAllowed", "publicNetworkScanningAllowed", "destructiveActionsAllowed"],
+      "properties": {
+        "liveActionsExecuted": { "type": "integer" },
+        "syntheticOnly": { "type": "boolean" },
+        "credentialCollectionAllowed": { "type": "boolean" },
+        "publicNetworkScanningAllowed": { "type": "boolean" },
+        "destructiveActionsAllowed": { "type": "boolean" }
+      }
+    },
+    "policyFabricRefs": { "type": "array", "items": { "type": "string" } },
+    "agentplaneRefs": { "type": "array", "items": { "type": "string" } },
+    "memoryMeshRefs": { "type": "array", "items": { "type": "string" } },
+    "sourceosReceiptRefs": { "type": "array", "items": { "type": "string" } },
+    "deliveryProjection": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["metricFamily", "riskScore", "scoreStatus", "deliveryMetricRefs"],
+      "properties": {
+        "metricFamily": { "const": "safety-security" },
+        "riskScore": { "type": "number" },
+        "scoreStatus": { "type": "string", "enum": ["green", "yellow", "red", "unknown"] },
+        "deliveryMetricRefs": { "type": "array", "items": { "type": "string" } }
+      }
+    }
+  }
+}
diff --git a/examples/scope-d/agent-harness-risk-assessment.example.json b/examples/scope-d/agent-harness-risk-assessment.example.json
@@ -0,0 +1,50 @@
+{
+  "schemaVersion": "v0.1",
+  "assessmentId": "agent-harness-risk-assessment-browser-terminal-v0.1",
+  "assessmentMode": "synthetic_only",
+  "target": {
+    "assetRef": "sourceos://tool-pack/browser-terminal-governed-surfaces",
+    "assetType": "browser-workflow",
+    "ownerRepo": "SourceOS-Linux/BearBrowser"
+  },
+  "riskLanes": ["browser", "terminal", "memory", "graph"],
+  "findings": [
+    {
+      "findingId": "finding-browser-form-submit-human-review",
+      "lane": "browser",
+      "severity": "medium",
+      "title": "Externally mutating browser actions require explicit human review.",
+      "evidenceRef": "github://SourceOS-Linux/BearBrowser/pull/22",
+      "recommendedControl": "Require BrowserActionGate and HumanControlEvent before live form-submit, upload, purchase/order, ticket creation, or message-send actions."
+    },
+    {
+      "findingId": "finding-terminal-host-mutation-gate",
+      "lane": "terminal",
+      "severity": "medium",
+      "title": "Host mutation must remain policy-gated and receipt-backed.",
+      "evidenceRef": "github://SourceOS-Linux/TurtleTerm/pull/5",
+      "recommendedControl": "Require TerminalActionGate, MutationReceipt, rollback reference, and operator approval for live host mutation."
+    }
+  ],
+  "safetyBoundary": {
+    "liveActionsExecuted": 0,
+    "syntheticOnly": true,
+    "credentialCollectionAllowed": false,
+    "publicNetworkScanningAllowed": false,
+    "destructiveActionsAllowed": false
+  },
+  "policyFabricRefs": ["github://SocioProphet/policy-fabric/pull/60"],
+  "agentplaneRefs": ["github://SocioProphet/agentplane/pull/107"],
+  "memoryMeshRefs": ["github://SocioProphet/memory-mesh/pull/23"],
+  "sourceosReceiptRefs": [
+    "github://SourceOS-Linux/sourceos-spec/pull/93",
+    "github://SourceOS-Linux/BearBrowser/pull/22",
+    "github://SourceOS-Linux/TurtleTerm/pull/5"
+  ],
+  "deliveryProjection": {
+    "metricFamily": "safety-security",
+    "riskScore": 62,
+    "scoreStatus": "yellow",
+    "deliveryMetricRefs": ["github://SocioProphet/delivery-excellence-automation/pull/7"]
+  }
+}