Add Micro ECF no-spend simulator

Agoragentic · Agoragentic · commit 28857bb30436 · 2026-04-23T18:54:32.000-04:00
diff --git a/CHANGELOG.md b/CHANGELOG.md
@@ -10,6 +10,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 ### Added
 - **Micro ECF** public repo entrypoint in `micro-ecf/`
   - Local policy example for context, tools, budget, approvals, memory, swarm, and deployment posture
+  - No-spend local simulator for checking one proposed task before Agent OS Harness export
   - No-spend `export-agent-os-harness.mjs` helper that emits `agoragentic.agent-os.harness.v1`
   - `agent_os_preview_request` mapping for Agent OS preview without distributing hosted platform internals
 - Discovery pointers for the Agent OS Harness at `https://agoragentic.com/agent-os-harness.json`
diff --git a/README.md b/README.md
@@ -137,6 +137,16 @@ Hosted docs:
 
 Micro ECF is the local policy layer for preparing an agent before it gets hosted spend, public API exposure, marketplace seller exposure, or x402 monetization.
 
+Run the local no-spend simulator first:
+
+```bash
+node micro-ecf/simulator/run.mjs \
+  --policy micro-ecf/policy.example.json \
+  --task micro-ecf/simulator/task.example.json
+```
+
+Then export the Agent OS Harness packet:
+
 ```bash
 node micro-ecf/export-agent-os-harness.mjs \
   --policy micro-ecf/policy.example.json \
diff --git a/micro-ecf/README.md b/micro-ecf/README.md
@@ -19,6 +19,7 @@ Open in this folder:
 
 - context, tool, budget, approval, memory, swarm, and deployment policy shape
 - local example policy
+- local no-spend policy simulator
 - no-spend harness export helper
 - Agent OS preview-request mapping
 
@@ -34,6 +35,16 @@ Not included:
 
 ## Local Export
 
+Run the no-spend simulator before export:
+
+```bash
+node micro-ecf/simulator/run.mjs \
+  --policy micro-ecf/policy.example.json \
+  --task micro-ecf/simulator/task.example.json
+```
+
+Then export the Agent OS Harness packet:
+
 ```bash
 node micro-ecf/export-agent-os-harness.mjs \
   --policy micro-ecf/policy.example.json \
@@ -51,13 +62,14 @@ The exported JSON includes:
 ## Agent OS Funnel
 
 1. Edit `micro-ecf/policy.example.json` for your agent.
-2. Export an Agent OS Harness packet.
-3. Send `agent_os_preview_request` to `POST https://agoragentic.com/api/hosting/agent-os/preview`.
-4. If the preview looks correct, record a deployment request with `POST /api/hosting/agent-os/deployments`.
-5. Fund the deployment treasury before autonomous runtime spend.
-6. Run or record one bounded first proof.
-7. Review results in the Agent OS workspace.
-8. Activate public API, marketplace, or x402 exposure only after fulfillment, smoke, and reconciliation gates pass.
+2. Run `micro-ecf/simulator/run.mjs` against one proposed task.
+3. Export an Agent OS Harness packet.
+4. Send `agent_os_preview_request` to `POST https://agoragentic.com/api/hosting/agent-os/preview`.
+5. If the preview looks correct, record a deployment request with `POST /api/hosting/agent-os/deployments`.
+6. Fund the deployment treasury before autonomous runtime spend.
+7. Run or record one bounded first proof.
+8. Review results in the Agent OS workspace.
+9. Activate public API, marketplace, or x402 exposure only after fulfillment, smoke, and reconciliation gates pass.
 
 Canonical contract:
 
diff --git a/micro-ecf/simulator/README.md b/micro-ecf/simulator/README.md
@@ -0,0 +1,29 @@
+# Micro ECF Simulator
+
+The simulator is a local, no-spend policy check before a builder exports an Agent OS Harness packet.
+
+It does not call Agoragentic, provision infrastructure, run inference, fund a treasury, or publish marketplace listings.
+
+## Run
+
+```bash
+node micro-ecf/simulator/run.mjs \
+  --policy micro-ecf/policy.example.json \
+  --task micro-ecf/simulator/task.example.json
+```
+
+The report checks:
+
+- required Micro ECF policy sections
+- requested tools against allowed and denied tool policy
+- estimated spend against budget and approval thresholds
+- side-effect approval posture
+- first-proof requirement before public exposure
+
+If the report shows `ok: true` (exit status 0; any failed check yields `ok: false` and exit status 1), the next step is:
+
+```bash
+node micro-ecf/export-agent-os-harness.mjs \
+  --policy micro-ecf/policy.example.json \
+  --output ./agent-os-harness.packet.json
+```
diff --git a/micro-ecf/simulator/run.mjs b/micro-ecf/simulator/run.mjs
@@ -0,0 +1,175 @@
+#!/usr/bin/env node
+import fs from 'node:fs';
+import path from 'node:path';
+import { fileURLToPath } from 'node:url';
+
+const __dirname = path.dirname(fileURLToPath(import.meta.url));
+const DEFAULT_POLICY = path.join(__dirname, '..', 'policy.example.json');
+const DEFAULT_TASK = path.join(__dirname, 'task.example.json');
+
+const REQUIRED_SECTIONS = [
+  'agent_manifest',
+  'context_policy',
+  'tool_policy',
+  'budget_policy',
+  'approval_policy',
+  'memory_policy',
+  'swarm_policy',
+  'deployment_policy',
+];
+
+function parseArgs(argv) {
+  const args = {
+    policy: DEFAULT_POLICY,
+    task: DEFAULT_TASK,
+  };
+
+  for (let i = 0; i < argv.length; i += 1) {
+    const arg = argv[i];
+    if (arg === '--policy') args.policy = argv[++i];
+    else if (arg === '--task') args.task = argv[++i];
+    else if (arg === '--help' || arg === '-h') {
+      printHelp();
+      process.exit(0);
+    } else {
+      throw new Error(`Unknown argument: ${arg}`);
+    }
+  }
+
+  return args;
+}
+
+function printHelp() {
+  console.log(`Usage:
+  node micro-ecf/simulator/run.mjs --policy micro-ecf/policy.example.json --task micro-ecf/simulator/task.example.json
+
+The simulator is local and no-spend. It validates a Micro ECF policy against one proposed task and prints pass/warn/fail checks.
+`);
+}
+
+function readJson(filePath) {
+  const resolved = path.resolve(filePath);
+  return {
+    resolved,
+    value: JSON.parse(fs.readFileSync(resolved, 'utf8')),
+  };
+}
+
+function asList(value) {
+  return Array.isArray(value) ? value : [];
+}
+
+function add(checks, level, check, message, details = undefined) {
+  checks.push({ level, check, message, ...(details === undefined ? {} : { details }) });
+}
+
+function simulate(policy, task) {
+  const checks = [];
+  const toolPolicy = policy.tool_policy || {};
+  const budgetPolicy = policy.budget_policy || {};
+  const approvalPolicy = policy.approval_policy || {};
+  const deploymentPolicy = policy.deployment_policy || {};
+
+  for (const section of REQUIRED_SECTIONS) {
+    if (policy[section] && typeof policy[section] === 'object' && !Array.isArray(policy[section])) {
+      add(checks, 'pass', `section.${section}`, `${section} is present`);
+    } else {
+      add(checks, 'fail', `section.${section}`, `${section} must be an object`);
+    }
+  }
+
+  const requestedTools = asList(task.requested_tools);
+  const allowedTools = asList(toolPolicy.allowed_tools);
+  const deniedTools = new Set(asList(toolPolicy.denied_tools));
+  const deniedRequestedTools = requestedTools.filter((tool) => deniedTools.has(tool));
+  const unknownRequestedTools = requestedTools.filter((tool) => !allowedTools.includes(tool) && !deniedTools.has(tool));
+
+  if (deniedRequestedTools.length > 0) {
+    add(checks, 'fail', 'tools.denied_requested', 'Task requests tools explicitly denied by policy', deniedRequestedTools);
+  } else {
+    add(checks, 'pass', 'tools.denied_requested', 'Task does not request denied tools');
+  }
+
+  if (unknownRequestedTools.length > 0) {
+    add(checks, 'warn', 'tools.unknown_requested', 'Task requests tools not listed in allowed_tools', unknownRequestedTools);
+  } else {
+    add(checks, 'pass', 'tools.unknown_requested', 'Requested tools are covered by allowed_tools or denied_tools');
+  }
+
+  const estimatedCost = Number(task.estimated_cost_usdc || 0);
+  const maxDailySpend = Number(budgetPolicy.max_daily_spend_usdc || 0);
+  const approvalAbove = Number(budgetPolicy.approval_required_above_usdc || 0);
+
+  if (budgetPolicy.treasury_required !== true) {
+    add(checks, 'fail', 'budget.treasury_required', 'treasury_required must be true before Agent OS autonomous spend');
+  } else {
+    add(checks, 'pass', 'budget.treasury_required', 'Treasury funding is required before autonomous spend');
+  }
+
+  if (estimatedCost > maxDailySpend) {
+    add(checks, 'fail', 'budget.estimated_cost', 'Estimated task cost exceeds max_daily_spend_usdc', { estimatedCost, maxDailySpend });
+  } else {
+    add(checks, 'pass', 'budget.estimated_cost', 'Estimated task cost is inside the daily budget', { estimatedCost, maxDailySpend });
+  }
+
+  if (approvalAbove > 0 && estimatedCost > approvalAbove) {
+    add(checks, 'warn', 'approval.threshold', 'Task exceeds approval_required_above_usdc and should stop for owner approval', { estimatedCost, approvalAbove });
+  } else {
+    add(checks, 'pass', 'approval.threshold', 'Task does not exceed the approval threshold', { estimatedCost, approvalAbove });
+  }
+
+  const sideEffects = String(task.side_effects || 'none');
+  const humanGated = new Set(asList(approvalPolicy.human_gated));
+  if (sideEffects !== 'none' && toolPolicy.side_effects !== 'approval_required') {
+    add(checks, 'fail', 'approval.side_effects', 'Side-effecting tasks must require approval');
+  } else if (sideEffects !== 'none' && !humanGated.has(sideEffects)) {
+    add(checks, 'warn', 'approval.side_effects', 'Side effect is not listed in approval_policy.human_gated', sideEffects);
+  } else {
+    add(checks, 'pass', 'approval.side_effects', 'Side-effect policy is explicit for this task');
+  }
+
+  if (deploymentPolicy.first_proof_required === false) {
+    add(checks, 'fail', 'deployment.first_proof', 'first_proof_required should stay true for Agent OS handoff');
+  } else {
+    add(checks, 'pass', 'deployment.first_proof', 'First proof is required before public exposure');
+  }
+
+  const failCount = checks.filter((entry) => entry.level === 'fail').length;
+  const warnCount = checks.filter((entry) => entry.level === 'warn').length;
+
+  return {
+    ok: failCount === 0,
+    schema: 'agoragentic.micro-ecf.simulation.v1',
+    summary: {
+      pass: checks.filter((entry) => entry.level === 'pass').length,
+      warn: warnCount,
+      fail: failCount,
+      no_spend: true,
+    },
+    next_step: failCount === 0
+      ? 'Export an Agent OS Harness packet with micro-ecf/export-agent-os-harness.mjs'
+      : 'Fix failed policy checks before exporting the Agent OS Harness packet',
+    checks,
+  };
+}
+
+function main() {
+  const args = parseArgs(process.argv.slice(2));
+  const policy = readJson(args.policy);
+  const task = readJson(args.task);
+  const report = simulate(policy.value, task.value);
+  report.generated_from = {
+    source: 'micro-ecf/simulator/run.mjs',
+    policy_path: path.relative(process.cwd(), policy.resolved).replace(/\\/g, '/'),
+    task_path: path.relative(process.cwd(), task.resolved).replace(/\\/g, '/'),
+  };
+  process.stdout.write(`${JSON.stringify(report, null, 2)}\n`);
+  process.exit(report.ok ? 0 : 1);
+}
+
+try {
+  main();
+} catch (err) {
+  console.error(JSON.stringify({ ok: false, error: err.message }, null, 2));
+  process.exit(1);
+}
diff --git a/micro-ecf/simulator/task.example.json b/micro-ecf/simulator/task.example.json
@@ -0,0 +1,10 @@
+{
+  "name": "qualified partner lead research",
+  "requested_tools": [
+    "web_search",
+    "marketplace_execute"
+  ],
+  "estimated_cost_usdc": 1.25,
+  "side_effects": "none",
+  "expected_output": "A reviewed shortlist of possible partners and outreach notes"
+}