{
  "schema_version": "2026-05-27.agent-task-ledger.v1",
  "name": "TokRepo Agent Task Run Ledger Eval",
  "canonical_url": "https://tokrepo.com/evals/agent-task-ledger.json",
  "updated_at": "2026-05-27",
  "generated_by": "node scripts/run_agent_task_ledger.mjs --json",
  "purpose": "Public, deterministic task-run ledger evidence for long-running, recurring, and delayed agent work. Each run records owner, schedule, status, latest evidence, next action, and rollback or handoff state.",
  "state_contract": {
    "required_fields": [
      "owner",
      "schedule",
      "status",
      "latest_evidence",
      "next_action",
      "rollback_or_handoff"
    ],
    "lifecycle_boundary": "A long-running task is not complete unless state and evidence survive across sessions.",
    "privacy_boundary": "No task text, file contents, access tokens, or private asset content are required in the public ledger."
  },
  "metrics": {
    "runs_total": 3,
    "runs_with_full_state": 3,
    "long_running_task_state_coverage_pct": 100,
    "evidence_attached_pct": 100,
    "stale_or_blocked_runs": 0
  },
  "task_runs": [
    {
      "run_id": "taskrun_agent_discovery_smoke_daily",
      "task": "Run daily agent discovery smoke and verify machine-readable surfaces before the next release window.",
      "task_type": "recurring_verification",
      "owner": "tokrepo-release-agent",
      "schedule": {
        "type": "daily",
        "cadence": "P1D",
        "timezone": "UTC",
        "next_run_at": "2026-05-28T00:20:00Z"
      },
      "status": "healthy",
      "latest_evidence": {
        "checked_at": "2026-05-27T02:46:00Z",
        "command": "WEB_BASE=https://tokrepo.com API_BASE=https://api.tokrepo.com node scripts/production-agent-discovery-check.mjs",
        "verdict": "pass_with_warning",
        "warning": "WARN_EXTERNAL_REGISTRY_LAG",
        "evidence_url": "https://tokrepo.com/.well-known/tokrepo.json"
      },
      "next_action": "Rerun after the external MCP Registry catches up to live manifest 2.16.1.",
      "rollback_or_handoff": {
        "type": "handoff",
        "target": "skills/codex-skill/tokrepo-product-test/SKILL.md",
        "trigger": "machine-readable endpoint regression or external registry lag persists past the next release window"
      },
      "lifecycle_gates": [
        "detect_high_value_task",
        "evaluate_task_outcome",
        "record_memory_and_state",
        "measure_task_economics"
      ],
      "state_snapshot": {
        "owner": "tokrepo-release-agent",
        "schedule": {
          "type": "daily",
          "cadence": "P1D",
          "timezone": "UTC",
          "next_run_at": "2026-05-28T00:20:00Z"
        },
        "status": "healthy",
        "latest_evidence": {
          "checked_at": "2026-05-27T02:46:00Z",
          "command": "WEB_BASE=https://tokrepo.com API_BASE=https://api.tokrepo.com node scripts/production-agent-discovery-check.mjs",
          "verdict": "pass_with_warning",
          "warning": "WARN_EXTERNAL_REGISTRY_LAG",
          "evidence_url": "https://tokrepo.com/.well-known/tokrepo.json"
        },
        "next_action": "Rerun after the external MCP Registry catches up to live manifest 2.16.1.",
        "rollback_or_handoff": {
          "type": "handoff",
          "target": "skills/codex-skill/tokrepo-product-test/SKILL.md",
          "trigger": "machine-readable endpoint regression or external registry lag persists past the next release window"
        }
      },
      "coverage": {
        "pass": true,
        "checks": [
          {
            "id": "state_field:owner",
            "pass": true
          },
          {
            "id": "state_field:schedule",
            "pass": true
          },
          {
            "id": "state_field:status",
            "pass": true
          },
          {
            "id": "state_field:latest_evidence",
            "pass": true
          },
          {
            "id": "state_field:next_action",
            "pass": true
          },
          {
            "id": "state_field:rollback_or_handoff",
            "pass": true
          },
          {
            "id": "schedule_has_next_run_at",
            "pass": true
          },
          {
            "id": "latest_evidence_has_verdict",
            "pass": true
          },
          {
            "id": "rollback_or_handoff_has_trigger",
            "pass": true
          }
        ]
      }
    },
    {
      "run_id": "taskrun_private_harvest_review_weekly",
      "task": "Review completed agent work for reusable private drafts without publishing user data or local-only secrets.",
      "task_type": "recurring_supply_harvest",
      "owner": "tokrepo-harvest-agent",
      "schedule": {
        "type": "weekly",
        "cadence": "P1W",
        "timezone": "UTC",
        "next_run_at": "2026-06-01T03:00:00Z"
      },
      "status": "ready",
      "latest_evidence": {
        "checked_at": "2026-05-27T02:47:00Z",
        "command": "node scripts/run_agent_task_harness.mjs --check-public",
        "verdict": "pass",
        "evidence_url": "https://tokrepo.com/evals/agent-task-harness.json"
      },
      "next_action": "Run tokrepo_harvest on changed reusable scripts, keep drafts private, and require quality_gate.status=pass before handoff.",
      "rollback_or_handoff": {
        "type": "rollback",
        "command": "tokrepo rollback --last --target codex --dry-run --json",
        "trigger": "quality gate fails or sensitive_findings is nonzero"
      },
      "lifecycle_gates": [
        "harvest_reusable_work",
        "record_memory_and_state",
        "measure_task_economics"
      ],
      "state_snapshot": {
        "owner": "tokrepo-harvest-agent",
        "schedule": {
          "type": "weekly",
          "cadence": "P1W",
          "timezone": "UTC",
          "next_run_at": "2026-06-01T03:00:00Z"
        },
        "status": "ready",
        "latest_evidence": {
          "checked_at": "2026-05-27T02:47:00Z",
          "command": "node scripts/run_agent_task_harness.mjs --check-public",
          "verdict": "pass",
          "evidence_url": "https://tokrepo.com/evals/agent-task-harness.json"
        },
        "next_action": "Run tokrepo_harvest on changed reusable scripts, keep drafts private, and require quality_gate.status=pass before handoff.",
        "rollback_or_handoff": {
          "type": "rollback",
          "command": "tokrepo rollback --last --target codex --dry-run --json",
          "trigger": "quality gate fails or sensitive_findings is nonzero"
        }
      },
      "coverage": {
        "pass": true,
        "checks": [
          {
            "id": "state_field:owner",
            "pass": true
          },
          {
            "id": "state_field:schedule",
            "pass": true
          },
          {
            "id": "state_field:status",
            "pass": true
          },
          {
            "id": "state_field:latest_evidence",
            "pass": true
          },
          {
            "id": "state_field:next_action",
            "pass": true
          },
          {
            "id": "state_field:rollback_or_handoff",
            "pass": true
          },
          {
            "id": "schedule_has_next_run_at",
            "pass": true
          },
          {
            "id": "latest_evidence_has_verdict",
            "pass": true
          },
          {
            "id": "rollback_or_handoff_has_trigger",
            "pass": true
          }
        ]
      }
    },
    {
      "run_id": "taskrun_delayed_chrome_mcp_recheck",
      "task": "Recheck Chrome MCP proxy health after a delayed reconnect or browser restart.",
      "task_type": "delayed_followup",
      "owner": "tokrepo-browser-ops-agent",
      "schedule": {
        "type": "delayed",
        "cadence": "PT30M",
        "timezone": "local",
        "next_run_at": "2026-05-27T03:30:00Z"
      },
      "status": "needs_recheck",
      "latest_evidence": {
        "checked_at": "2026-05-27T03:10:00Z",
        "command": "curl --noproxy \"*\" http://127.0.0.1:9401/proxy/status",
        "verdict": "pass_proxy_connected",
        "evidence_url": "local:chrome-mcp-proxy-status"
      },
      "next_action": "If MCP stdio transport is closed in the current agent session, reconnect the MCP server or start a fresh Codex session before browser-dependent validation.",
      "rollback_or_handoff": {
        "type": "handoff",
        "target": "Chrome MCP 完整运维 Skill",
        "trigger": "mcp__chrome__ list_pages reports Transport closed after proxy health is green"
      },
      "lifecycle_gates": [
        "plan_safe_run",
        "execute_or_stage",
        "evaluate_task_outcome",
        "record_memory_and_state"
      ],
      "state_snapshot": {
        "owner": "tokrepo-browser-ops-agent",
        "schedule": {
          "type": "delayed",
          "cadence": "PT30M",
          "timezone": "local",
          "next_run_at": "2026-05-27T03:30:00Z"
        },
        "status": "needs_recheck",
        "latest_evidence": {
          "checked_at": "2026-05-27T03:10:00Z",
          "command": "curl --noproxy \"*\" http://127.0.0.1:9401/proxy/status",
          "verdict": "pass_proxy_connected",
          "evidence_url": "local:chrome-mcp-proxy-status"
        },
        "next_action": "If MCP stdio transport is closed in the current agent session, reconnect the MCP server or start a fresh Codex session before browser-dependent validation.",
        "rollback_or_handoff": {
          "type": "handoff",
          "target": "Chrome MCP 完整运维 Skill",
          "trigger": "mcp__chrome__ list_pages reports Transport closed after proxy health is green"
        }
      },
      "coverage": {
        "pass": true,
        "checks": [
          {
            "id": "state_field:owner",
            "pass": true
          },
          {
            "id": "state_field:schedule",
            "pass": true
          },
          {
            "id": "state_field:status",
            "pass": true
          },
          {
            "id": "state_field:latest_evidence",
            "pass": true
          },
          {
            "id": "state_field:next_action",
            "pass": true
          },
          {
            "id": "state_field:rollback_or_handoff",
            "pass": true
          },
          {
            "id": "schedule_has_next_run_at",
            "pass": true
          },
          {
            "id": "latest_evidence_has_verdict",
            "pass": true
          },
          {
            "id": "rollback_or_handoff_has_trigger",
            "pass": true
          }
        ]
      }
    }
  ]
}
