{
  "schema": "coeval-task-001-dashboard-v1",
  "ts": "2026-06-10T07:54:49Z",
  "task": "co-eval-task-001",
  "phase_status": {
    "phase": "done",
    "round": 40,
    "paused": false,
    "abort_requested": false,
    "benchmark_version": "3.2",
    "fire_at": 1779182192,
    "last_change_at": 1779285566,
    "winner_foss": "AE-autoqueued-llama3.2-latest",
    "winner_nonfoss": "bare-chatgpt-best"
  },
  "participants": {
    "total": 52,
    "foss": 48,
    "non_foss": 4
  },
  "leaderboard": [
    {
      "de": "bare-chatgpt-best",
      "rolling_mean": 5.91,
      "std": 0.878,
      "n_samples": 90,
      "group": "non-foss"
    },
    {
      "de": "AE-chatgpt-best",
      "rolling_mean": 5.41,
      "std": 1.586,
      "n_samples": 160,
      "group": "non-foss"
    },
    {
      "de": "AE-claude-best",
      "rolling_mean": 5.371,
      "std": 0.924,
      "n_samples": 90,
      "group": "non-foss"
    },
    {
      "de": "bare-chatgpt-cheap",
      "rolling_mean": 5.286,
      "std": 0.709,
      "n_samples": 90,
      "group": "non-foss"
    },
    {
      "de": "AE-autoqueued-llama3.2-latest",
      "rolling_mean": 5.225,
      "std": 1.348,
      "n_samples": 200,
      "group": "foss"
    },
    {
      "de": "AE-claude-cheap",
      "rolling_mean": 5.122,
      "std": 0.992,
      "n_samples": 90,
      "group": "non-foss"
    },
    {
      "de": "AE-autoqueued-granite4.1-8b",
      "rolling_mean": 4.787,
      "std": 1.535,
      "n_samples": 202,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-llama3.1-8b",
      "rolling_mean": 4.676,
      "std": 1.382,
      "n_samples": 180,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-qwen2.5-coder-7b",
      "rolling_mean": 4.628,
      "std": 1.777,
      "n_samples": 200,
      "group": "foss"
    },
    {
      "de": "AE-flagship-v4",
      "rolling_mean": 4.5,
      "std": 1.263,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-deepseek-r1-14b",
      "rolling_mean": 4.45,
      "std": 1.481,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-devstral-24b",
      "rolling_mean": 4.422,
      "std": 1.574,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-c4-B",
      "rolling_mean": 4.42,
      "std": 1.334,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-deepseek-r1-1.5b",
      "rolling_mean": 4.388,
      "std": 0.897,
      "n_samples": 190,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-granite4.1-3b",
      "rolling_mean": 4.372,
      "std": 1.4,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-c3-A",
      "rolling_mean": 4.332,
      "std": 2.052,
      "n_samples": 147,
      "group": "foss"
    },
    {
      "de": "AE-c4-A",
      "rolling_mean": 4.288,
      "std": 1.623,
      "n_samples": 202,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-gemma4-latest",
      "rolling_mean": 4.253,
      "std": 1.666,
      "n_samples": 204,
      "group": "foss"
    },
    {
      "de": "AE-c2-A",
      "rolling_mean": 4.188,
      "std": 1.82,
      "n_samples": 188,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-mistral-nemo-12b",
      "rolling_mean": 4.16,
      "std": 1.82,
      "n_samples": 201,
      "group": "foss"
    },
    {
      "de": "AE-flagship-v3",
      "rolling_mean": 4.126,
      "std": 1.49,
      "n_samples": 203,
      "group": "foss"
    },
    {
      "de": "AE-c5-A",
      "rolling_mean": 4.064,
      "std": 1.268,
      "n_samples": 203,
      "group": "foss"
    },
    {
      "de": "AE-c5-B",
      "rolling_mean": 4.042,
      "std": 1.523,
      "n_samples": 202,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-qwen2.5-coder-14b",
      "rolling_mean": 4.021,
      "std": 2.051,
      "n_samples": 193,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-phi4-14b",
      "rolling_mean": 4.003,
      "std": 1.876,
      "n_samples": 200,
      "group": "foss"
    },
    {
      "de": "AE-chatgpt-cheap",
      "rolling_mean": 3.995,
      "std": 1.486,
      "n_samples": 202,
      "group": "foss"
    },
    {
      "de": "AE-flagship-v2",
      "rolling_mean": 3.952,
      "std": 1.348,
      "n_samples": 180,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-phi4-latest",
      "rolling_mean": 3.919,
      "std": 1.847,
      "n_samples": 200,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-deepseek-r1-8b",
      "rolling_mean": 3.909,
      "std": 1.68,
      "n_samples": 195,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-glm4-9b",
      "rolling_mean": 3.888,
      "std": 1.633,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-hermes3-8b",
      "rolling_mean": 3.782,
      "std": 1.781,
      "n_samples": 201,
      "group": "foss"
    },
    {
      "de": "AE-c3-B",
      "rolling_mean": 3.706,
      "std": 1.788,
      "n_samples": 197,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-falcon3-1b",
      "rolling_mean": 3.644,
      "std": 1.65,
      "n_samples": 204,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-gemma3-latest",
      "rolling_mean": 3.535,
      "std": 1.632,
      "n_samples": 204,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-hermes3-3b",
      "rolling_mean": 3.532,
      "std": 1.832,
      "n_samples": 201,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-opencoder-1.5b",
      "rolling_mean": 3.428,
      "std": 1.649,
      "n_samples": 205,
      "group": "foss"
    },
    {
      "de": "AE-c2-B",
      "rolling_mean": 3.4,
      "std": 1.684,
      "n_samples": 168,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-smollm2-1.7b",
      "rolling_mean": 3.397,
      "std": 1.591,
      "n_samples": 197,
      "group": "foss"
    },
    {
      "de": "AE-c1-B",
      "rolling_mean": 3.317,
      "std": 1.877,
      "n_samples": 159,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-stablelm2-1.6b",
      "rolling_mean": 2.969,
      "std": 1.793,
      "n_samples": 153,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-smollm2-360m",
      "rolling_mean": 2.848,
      "std": 1.966,
      "n_samples": 152,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-phi3.5-3.8b",
      "rolling_mean": 2.699,
      "std": 1.786,
      "n_samples": 192,
      "group": "foss"
    },
    {
      "de": "AE-autoqueued-olmo2-7b",
      "rolling_mean": 2.63,
      "std": 2.017,
      "n_samples": 184,
      "group": "foss"
    },
    {
      "de": "AE-c1-A",
      "rolling_mean": 2.607,
      "std": 2.206,
      "n_samples": 200,
      "group": "foss"
    }
  ],
  "convergence": {
    "cleaned_v3_1": [
      {
        "pair": "r0->r1",
        "tmean_clean": 0.16518452708677228,
        "tmean_rel": 0.1255164337484897,
        "n0_flip": 44,
        "n_clean": 196,
        "over_clean": 145
      },
      {
        "pair": "r1->r2",
        "tmean_clean": 0.14087665585852532,
        "tmean_rel": 0.1074881213505348,
        "n0_flip": 44,
        "n_clean": 196,
        "over_clean": 132
      },
      {
        "pair": "r2->r3",
        "tmean_clean": 0.13442557582099335,
        "tmean_rel": 0.10488702931027973,
        "n0_flip": 46,
        "n_clean": 194,
        "over_clean": 139
      },
      {
        "pair": "r3->r4",
        "tmean_clean": 0.21170896978670933,
        "tmean_rel": 0.17026329845280327,
        "n0_flip": 45,
        "n_clean": 190,
        "over_clean": 153
      },
      {
        "pair": "r4->r5",
        "tmean_clean": 0.25799009954864466,
        "tmean_rel": 0.2436221926435666,
        "n0_flip": 51,
        "n_clean": 184,
        "over_clean": 152
      },
      {
        "pair": "r5->r6",
        "tmean_clean": 0.3243658046565541,
        "tmean_rel": 0.3175984523801517,
        "n0_flip": 59,
        "n_clean": 171,
        "over_clean": 135
      },
      {
        "pair": "r6->r7",
        "tmean_clean": 0.21994540694998424,
        "tmean_rel": 0.17973919180882825,
        "n0_flip": 61,
        "n_clean": 164,
        "over_clean": 119
      },
      {
        "pair": "r7->r8",
        "tmean_clean": 0.19898449914342856,
        "tmean_rel": 0.1593935658571341,
        "n0_flip": 67,
        "n_clean": 168,
        "over_clean": 122
      },
      {
        "pair": "r8->r9",
        "tmean_clean": 0.22248010691030334,
        "tmean_rel": 0.219721659758363,
        "n0_flip": 66,
        "n_clean": 169,
        "over_clean": 128
      },
      {
        "pair": "r9->r10",
        "tmean_clean": 0.1570663883052538,
        "tmean_rel": 0.1380357623326577,
        "n0_flip": 52,
        "n_clean": 183,
        "over_clean": 109
      },
      {
        "pair": "r10->r11",
        "tmean_clean": 0.15949777806688722,
        "tmean_rel": 0.13283423890952015,
        "n0_flip": 51,
        "n_clean": 184,
        "over_clean": 117
      },
      {
        "pair": "r11->r12",
        "tmean_clean": 0.27721117738367773,
        "tmean_rel": 0.2532452925051025,
        "n0_flip": 58,
        "n_clean": 172,
        "over_clean": 121
      },
      {
        "pair": "r12->r13",
        "tmean_clean": 0.20519304108135178,
        "tmean_rel": 0.24115541511143077,
        "n0_flip": 70,
        "n_clean": 155,
        "over_clean": 104
      },
      {
        "pair": "r13->r14",
        "tmean_clean": 0.27504477443406355,
        "tmean_rel": 0.3042727960288155,
        "n0_flip": 68,
        "n_clean": 162,
        "over_clean": 103
      },
      {
        "pair": "r14->r15",
        "tmean_clean": 0.35070631486377946,
        "tmean_rel": 0.28221245978929443,
        "n0_flip": 57,
        "n_clean": 173,
        "over_clean": 118
      },
      {
        "pair": "r15->r16",
        "tmean_clean": 0.7908239323660623,
        "tmean_rel": 0.6564517205351137,
        "n0_flip": 63,
        "n_clean": 172,
        "over_clean": 112
      },
      {
        "pair": "r16->r17",
        "tmean_clean": 0.2990889675226553,
        "tmean_rel": 0.2769478810147933,
        "n0_flip": 71,
        "n_clean": 159,
        "over_clean": 121
      },
      {
        "pair": "r17->r18",
        "tmean_clean": 0.31242754906502623,
        "tmean_rel": 0.3213729843170188,
        "n0_flip": 70,
        "n_clean": 160,
        "over_clean": 125
      },
      {
        "pair": "r18->r19",
        "tmean_clean": 0.24036273963945312,
        "tmean_rel": 0.2927646639967077,
        "n0_flip": 69,
        "n_clean": 161,
        "over_clean": 103
      },
      {
        "pair": "r19->r20",
        "tmean_clean": 0.3164800117186526,
        "tmean_rel": 0.27742800259846034,
        "n0_flip": 68,
        "n_clean": 167,
        "over_clean": 116
      },
      {
        "pair": "r20->r21",
        "tmean_clean": 0.4717806573286166,
        "tmean_rel": 0.399989413183987,
        "n0_flip": 63,
        "n_clean": 177,
        "over_clean": 111
      },
      {
        "pair": "r21->r22",
        "tmean_clean": 0.17996939002122606,
        "tmean_rel": 0.17226334610989563,
        "n0_flip": 68,
        "n_clean": 167,
        "over_clean": 99
      }
    ],
    "live_v3_2_or_current": [
      {
        "pair": "r0->r1",
        "tmean_clean": 0.16518452708677228,
        "tmean_rel": 0.1255164337484897,
        "n0_flip": 44,
        "n_clean": 196,
        "over_clean": 145
      },
      {
        "pair": "r1->r2",
        "tmean_clean": 0.14087665585852532,
        "tmean_rel": 0.1074881213505348,
        "n0_flip": 44,
        "n_clean": 196,
        "over_clean": 132
      },
      {
        "pair": "r2->r3",
        "tmean_clean": 0.13442557582099335,
        "tmean_rel": 0.10488702931027973,
        "n0_flip": 46,
        "n_clean": 194,
        "over_clean": 139
      },
      {
        "pair": "r3->r4",
        "tmean_clean": 0.21170896978670933,
        "tmean_rel": 0.17026329845280327,
        "n0_flip": 45,
        "n_clean": 190,
        "over_clean": 153
      },
      {
        "pair": "r4->r5",
        "tmean_clean": 0.25799009954864466,
        "tmean_rel": 0.2436221926435666,
        "n0_flip": 51,
        "n_clean": 184,
        "over_clean": 152
      },
      {
        "pair": "r5->r6",
        "tmean_clean": 0.3243658046565541,
        "tmean_rel": 0.3175984523801517,
        "n0_flip": 59,
        "n_clean": 171,
        "over_clean": 135
      },
      {
        "pair": "r6->r7",
        "tmean_clean": 0.21994540694998424,
        "tmean_rel": 0.17973919180882825,
        "n0_flip": 61,
        "n_clean": 164,
        "over_clean": 119
      },
      {
        "pair": "r7->r8",
        "tmean_clean": 0.19898449914342856,
        "tmean_rel": 0.1593935658571341,
        "n0_flip": 67,
        "n_clean": 168,
        "over_clean": 122
      },
      {
        "pair": "r8->r9",
        "tmean_clean": 0.22248010691030334,
        "tmean_rel": 0.219721659758363,
        "n0_flip": 66,
        "n_clean": 169,
        "over_clean": 128
      },
      {
        "pair": "r9->r10",
        "tmean_clean": 0.1570663883052538,
        "tmean_rel": 0.1380357623326577,
        "n0_flip": 52,
        "n_clean": 183,
        "over_clean": 109
      },
      {
        "pair": "r10->r11",
        "tmean_clean": 0.15949777806688722,
        "tmean_rel": 0.13283423890952015,
        "n0_flip": 51,
        "n_clean": 184,
        "over_clean": 117
      },
      {
        "pair": "r11->r12",
        "tmean_clean": 0.27721117738367773,
        "tmean_rel": 0.2532452925051025,
        "n0_flip": 58,
        "n_clean": 172,
        "over_clean": 121
      },
      {
        "pair": "r12->r13",
        "tmean_clean": 0.20519304108135178,
        "tmean_rel": 0.24115541511143077,
        "n0_flip": 70,
        "n_clean": 155,
        "over_clean": 104
      },
      {
        "pair": "r13->r14",
        "tmean_clean": 0.27504477443406355,
        "tmean_rel": 0.3042727960288155,
        "n0_flip": 68,
        "n_clean": 162,
        "over_clean": 103
      },
      {
        "pair": "r14->r15",
        "tmean_clean": 0.35070631486377946,
        "tmean_rel": 0.28221245978929443,
        "n0_flip": 57,
        "n_clean": 173,
        "over_clean": 118
      },
      {
        "pair": "r15->r16",
        "tmean_clean": 0.7908239323660623,
        "tmean_rel": 0.6564517205351137,
        "n0_flip": 63,
        "n_clean": 172,
        "over_clean": 112
      },
      {
        "pair": "r16->r17",
        "tmean_clean": 0.2990889675226553,
        "tmean_rel": 0.2769478810147933,
        "n0_flip": 71,
        "n_clean": 159,
        "over_clean": 121
      },
      {
        "pair": "r17->r18",
        "tmean_clean": 0.31242754906502623,
        "tmean_rel": 0.3213729843170188,
        "n0_flip": 70,
        "n_clean": 160,
        "over_clean": 125
      },
      {
        "pair": "r18->r19",
        "tmean_clean": 0.24036273963945312,
        "tmean_rel": 0.2927646639967077,
        "n0_flip": 69,
        "n_clean": 161,
        "over_clean": 103
      },
      {
        "pair": "r19->r20",
        "tmean_clean": 0.3164800117186526,
        "tmean_rel": 0.27742800259846034,
        "n0_flip": 68,
        "n_clean": 167,
        "over_clean": 116
      },
      {
        "pair": "r20->r21",
        "tmean_clean": 0.4717806573286166,
        "tmean_rel": 0.399989413183987,
        "n0_flip": 63,
        "n_clean": 177,
        "over_clean": 111
      },
      {
        "pair": "r21->r22",
        "tmean_clean": 0.17996939002122606,
        "tmean_rel": 0.17226334610989563,
        "n0_flip": 68,
        "n_clean": 167,
        "over_clean": 99
      },
      {
        "pair": "r22->r23",
        "tmean_clean": 0.33997435819955624,
        "tmean_rel": 0.3515744018389571,
        "n0_flip": 72,
        "n_clean": 163,
        "over_clean": 144
      },
      {
        "pair": "r23->r24",
        "tmean_clean": 0.5595972268942627,
        "tmean_rel": 0.5329055871400552,
        "n0_flip": 56,
        "n_clean": 204,
        "over_clean": 179
      },
      {
        "pair": "r24->r25",
        "tmean_clean": 0.12894610557220595,
        "tmean_rel": 0.11382361130075035,
        "n0_flip": 48,
        "n_clean": 212,
        "over_clean": 146
      },
      {
        "pair": "r25->r26",
        "tmean_clean": 0.16621233894029663,
        "tmean_rel": 0.13871191776559358,
        "n0_flip": 48,
        "n_clean": 212,
        "over_clean": 168
      },
      {
        "pair": "r26->r27",
        "tmean_clean": 0.3031350099173319,
        "tmean_rel": 0.26152689007794516,
        "n0_flip": 49,
        "n_clean": 211,
        "over_clean": 172
      },
      {
        "pair": "r27->r28",
        "tmean_clean": 0.5637510990252235,
        "tmean_rel": 0.4314094748517334,
        "n0_flip": 46,
        "n_clean": 214,
        "over_clean": 192
      },
      {
        "pair": "r28->r29",
        "tmean_clean": 0.19546284908024117,
        "tmean_rel": 0.1725529266995185,
        "n0_flip": 51,
        "n_clean": 209,
        "over_clean": 162
      },
      {
        "pair": "r29->r30",
        "tmean_clean": 0.13862517398183977,
        "tmean_rel": 0.12379980143312935,
        "n0_flip": 55,
        "n_clean": 205,
        "over_clean": 141
      },
      {
        "pair": "r30->r31",
        "tmean_clean": 0.13253494184535855,
        "tmean_rel": 0.14426073776295134,
        "n0_flip": 51,
        "n_clean": 209,
        "over_clean": 126
      },
      {
        "pair": "r31->r32",
        "tmean_clean": 0.18621260226791006,
        "tmean_rel": 0.15998423113846433,
        "n0_flip": 40,
        "n_clean": 220,
        "over_clean": 175
      },
      {
        "pair": "r32->r33",
        "tmean_clean": 0.18135746383779572,
        "tmean_rel": 0.16661469242766078,
        "n0_flip": 45,
        "n_clean": 215,
        "over_clean": 162
      },
      {
        "pair": "r33->r34",
        "tmean_clean": 0.17898587286031145,
        "tmean_rel": 0.14732472056583745,
        "n0_flip": 44,
        "n_clean": 216,
        "over_clean": 157
      },
      {
        "pair": "r34->r35",
        "tmean_clean": 0.2102374851059732,
        "tmean_rel": 0.18370319837395746,
        "n0_flip": 46,
        "n_clean": 214,
        "over_clean": 175
      },
      {
        "pair": "r35->r36",
        "tmean_clean": 0.19244299439127,
        "tmean_rel": 0.15732938686254316,
        "n0_flip": 40,
        "n_clean": 220,
        "over_clean": 164
      },
      {
        "pair": "r36->r37",
        "tmean_clean": 0.15320331991737157,
        "tmean_rel": 0.13212709238110817,
        "n0_flip": 45,
        "n_clean": 215,
        "over_clean": 159
      },
      {
        "pair": "r37->r38",
        "tmean_clean": 0.11730916811724311,
        "tmean_rel": 0.11739307030492249,
        "n0_flip": 50,
        "n_clean": 210,
        "over_clean": 130
      },
      {
        "pair": "r38->r39",
        "tmean_clean": 0.1978849360193365,
        "tmean_rel": 0.19322380733262878,
        "n0_flip": 50,
        "n_clean": 210,
        "over_clean": 159
      },
      {
        "pair": "r39->r40",
        "tmean_clean": 0.18853111640933073,
        "tmean_rel": 0.22879128167544208,
        "n0_flip": 55,
        "n_clean": 205,
        "over_clean": 142
      }
    ],
    "pre_v3_2_archive": [
      {
        "pair": "r0->r1",
        "tmean_clean": null,
        "tmean_rel": 0.1255164337484897,
        "n0_flip": null
      },
      {
        "pair": "r1->r2",
        "tmean_clean": null,
        "tmean_rel": 0.1074881213505348,
        "n0_flip": null
      },
      {
        "pair": "r2->r3",
        "tmean_clean": null,
        "tmean_rel": 0.10488702931027973,
        "n0_flip": null
      },
      {
        "pair": "r3->r4",
        "tmean_clean": null,
        "tmean_rel": 0.17026329845280327,
        "n0_flip": null
      },
      {
        "pair": "r4->r5",
        "tmean_clean": null,
        "tmean_rel": 0.2436221926435666,
        "n0_flip": null
      },
      {
        "pair": "r5->r6",
        "tmean_clean": null,
        "tmean_rel": 0.3175984523801517,
        "n0_flip": null
      },
      {
        "pair": "r6->r7",
        "tmean_clean": 0.21994540694998424,
        "tmean_rel": 0.17973919180882825,
        "n0_flip": 61
      },
      {
        "pair": "r7->r8",
        "tmean_clean": 0.19898449914342856,
        "tmean_rel": 0.1593935658571341,
        "n0_flip": 67
      },
      {
        "pair": "r8->r9",
        "tmean_clean": 0.22248010691030334,
        "tmean_rel": 0.219721659758363,
        "n0_flip": 66
      },
      {
        "pair": "r9->r10",
        "tmean_clean": 0.1570663883052538,
        "tmean_rel": 0.1380357623326577,
        "n0_flip": 52
      },
      {
        "pair": "r10->r11",
        "tmean_clean": 0.15949777806688722,
        "tmean_rel": 0.13283423890952015,
        "n0_flip": 51
      },
      {
        "pair": "r11->r12",
        "tmean_clean": 0.27721117738367773,
        "tmean_rel": 0.2532452925051025,
        "n0_flip": 58
      },
      {
        "pair": "r12->r13",
        "tmean_clean": 0.20519304108135178,
        "tmean_rel": 0.24115541511143077,
        "n0_flip": 70
      },
      {
        "pair": "r13->r14",
        "tmean_clean": 0.27504477443406355,
        "tmean_rel": 0.3042727960288155,
        "n0_flip": 68
      },
      {
        "pair": "r14->r15",
        "tmean_clean": 0.35070631486377946,
        "tmean_rel": 0.28221245978929443,
        "n0_flip": 57
      },
      {
        "pair": "r15->r16",
        "tmean_clean": 0.7908239323660623,
        "tmean_rel": 0.6564517205351137,
        "n0_flip": 63
      },
      {
        "pair": "r16->r17",
        "tmean_clean": 0.2990889675226553,
        "tmean_rel": 0.2769478810147933,
        "n0_flip": 71
      },
      {
        "pair": "r17->r18",
        "tmean_clean": 0.31589876544460815,
        "tmean_rel": 0.3235790404134444,
        "n0_flip": 70
      },
      {
        "pair": "r18->r19",
        "tmean_clean": 0.24036273963945312,
        "tmean_rel": 0.2927646639967077,
        "n0_flip": 69
      },
      {
        "pair": "r19->r20",
        "tmean_clean": 0.3164800117186526,
        "tmean_rel": 0.27742800259846034,
        "n0_flip": 68
      },
      {
        "pair": "r20->r21",
        "tmean_clean": 0.4415385890273437,
        "tmean_rel": 0.38983739762094166,
        "n0_flip": 63
      },
      {
        "pair": "r21->r22",
        "tmean_clean": 0.17996939002122606,
        "tmean_rel": 0.17226334610989563,
        "n0_flip": 68
      }
    ]
  },
  "v3_final_report": {
    "main_md": "state/aeschool/co-eval-task-001/stage4/final-report-v3-main.md",
    "appendix_stats_md": "state/aeschool/co-eval-task-001/stage4/final-report-v3-appendix-stats.md",
    "bundle_md": "state/aeschool/co-eval-task-001/stage4/final-report-v3-bundle.md",
    "protondrive_folder": "protondrive:co-eval-task-001-final-report-2026-05-20/"
  },
  "notes": {
    "rolling_mean_min_samples": 50,
    "winner_pick_rule": "rolling mean across all rounds, filter n >= 50",
    "phantom_cleanup_applied": true,
    "see_also": [
      "docs/morning-state-2026-05-20.md",
      "docs/v3.1-cyclic-divergence-analysis-2026-05-20.md"
    ]
  }
}