{
  "schema_version": "claim_to_evidence_table_v0",
  "updated": "2026-05-27",
  "public_private_boundary": "Public rows expose bounded claims, public artifacts, known limits, and repair routes. They do not expose private financial execution details, customer data, internal agent orchestration, commercial schedulers, API keys, or anonymous conference packages.",
  "rows": [
    {
      "claim_id": "P02-C1",
      "claim": "WisdomBench measures longitudinal learning from failure rather than single-shot task capability.",
      "evidence_ids": [
        "E-P02-3600",
        "E-P02-ARTIFACT"
      ],
      "evidence_status": "public_supporting",
      "public_artifacts": [
        "https://github.com/mmjbds/wisdombench",
        "https://huggingface.co/datasets/MMJBDS/wisdombench",
        "https://zenodo.org/records/19793098"
      ],
      "does_not_prove": "Human-like wisdom, general deployment reliability, or that all agents learn from failure.",
      "downgrade_trigger": "If task leakage, scoring bugs, reproduction failure, or stronger baselines remove the longitudinal effect.",
      "attack_routes": [
        "data leakage",
        "stronger baseline",
        "reproduction failure",
        "claim boundary too broad"
      ],
      "counterexample_route": "https://github.com/mmjbds/wisdombench/issues/new/choose"
    },
    {
      "claim_id": "PCA-C1",
      "claim": "High-risk AI action should not earn action credit until warrant and receipt closure exist.",
      "evidence_ids": [
        "E-PCA-MINI-GATE",
        "E-PCA-PUBLIC-REPO"
      ],
      "evidence_status": "public_protocol_and_interface_demo",
      "public_artifacts": [
        "https://github.com/mmjbds/proof-carrying-action",
        "https://mmjbds-mianzhang-org.static.hf.space/demos/proof-action-mini/index.html"
      ],
      "does_not_prove": "Live trading profit, private product performance, or universal safety.",
      "downgrade_trigger": "If the public gate allows unsafe action, gives credit without receipts, or cannot reproduce its no-go boundary.",
      "attack_routes": [
        "false no-go",
        "missing receipt",
        "credit leak",
        "unsafe action allowed"
      ],
      "counterexample_route": "https://github.com/mmjbds/proof-carrying-action/issues/new/choose"
    },
    {
      "claim_id": "P24-C1",
      "claim": "Adaptive systems need relational observability: relations, constraints, control debt, and evidence half-life, not a scalar score alone.",
      "evidence_ids": [
        "E-P24-PROTOCOL",
        "E-REGISTRY-LAYER"
      ],
      "evidence_status": "public_protocol_stage",
      "public_artifacts": [
        "https://mmjbds-mianzhang-org.static.hf.space/technology/index.html",
        "https://mmjbds-mianzhang-org.static.hf.space/registries/index.html",
        "https://mmjbds-mianzhang-org.static.hf.space/evidence/index.html"
      ],
      "does_not_prove": "A theorem covering all adaptive systems or a finished private product.",
      "downgrade_trigger": "If relation variables, control debt, or evidence half-life do not change decisions beyond scalar baselines.",
      "attack_routes": [
        "unmeasured relation variable",
        "unmeasured control debt",
        "failed transfer",
        "strong scalar baseline"
      ],
      "counterexample_route": "https://mmjbds-mianzhang-org.static.hf.space/counterexamples/index.html"
    },
    {
      "claim_id": "P20-C1",
      "claim": "Physical AI should route degraded evidence to recovery or abstention rather than direct action.",
      "evidence_ids": [
        "E-P20-STRESS-PANEL",
        "E-P20-BOUNDARY"
      ],
      "evidence_status": "public_bounded_support_and_rebuild_needed",
      "public_artifacts": [
        "https://zenodo.org/records/20097570",
        "https://mmjbds-mianzhang-org.static.hf.space/counterexamples/index.html"
      ],
      "does_not_prove": "Detector SOTA, offensive autonomy, or real-world robot deployment performance.",
      "downgrade_trigger": "If stronger conformal, shield, or fusion baselines handle the same degraded evidence without the proposed boundary.",
      "attack_routes": [
        "independent public dataset",
        "stronger conformal/shield baseline",
        "real log mismatch",
        "action coverage tradeoff"
      ],
      "counterexample_route": "https://mmjbds-mianzhang-org.static.hf.space/counterexamples/index.html"
    },
    {
      "claim_id": "F1-C1",
      "claim": "Trading is used as a high-risk testbed for proof-carrying action discipline, not as a public claim of live profitability.",
      "evidence_ids": [
        "E-F1-NOGO",
        "E-F1-SCHEMA"
      ],
      "evidence_status": "public_boundary_and_private_briefing_route",
      "public_artifacts": [
        "https://zenodo.org/records/20156365",
        "https://mmjbds-mianzhang-org.static.hf.space/private-briefing/pilot-packet.html"
      ],
      "does_not_prove": "Live trading edge, customer readiness, private execution quality, or alpha dominance.",
      "downgrade_trigger": "If public language implies live profitability, private execution readiness, or authority beyond no-go evidence.",
      "attack_routes": [
        "claim boundary too broad",
        "missing public schema",
        "no-go misinterpreted",
        "credit leak"
      ],
      "counterexample_route": "https://github.com/mmjbds/proof-carrying-action/issues/new/choose"
    }
  ]
}
