{
  "meta": {
    "source": "Horizon (Orin Labs)",
    "generated_at": "2026-06-17T14:19:47.508488+00:00",
    "note": "Per-task metadata (difficulty + axes) and per-run cases (task id, pass, cost, tokens, time). Same data the leaderboard is derived from."
  },
  "tasks": {
    "108-24-no-recording-sessions-policy-v0": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 2731,
      "burial_depth_tokens": 874945,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "24",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-24",
        "no-recording-policy",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "108-24-no-recording-sessions-policy-v1": {
      "difficulty": "hard",
      "anticipability": 4,
      "burial_depth": 2731,
      "burial_depth_tokens": 874945,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "24",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-24",
        "no-recording-policy",
        "anticipability-mid",
        "md-low",
        "n-hops-1"
      ]
    },
    "108-24-no-recording-sessions-policy-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 2731,
      "burial_depth_tokens": 874945,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "24",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-24",
        "no-recording-policy",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "108-24-no-recording-sessions-policy-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 2731,
      "burial_depth_tokens": 874945,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "24",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-24",
        "no-recording-policy",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "108-25-sibling-name-disambiguation-holden-hayden-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 12663,
      "burial_depth_tokens": 2925348,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 3,
      "family": "25",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-25",
        "sibling-name",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "108-25-sibling-name-disambiguation-holden-hayden-v1": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 12663,
      "burial_depth_tokens": 2925348,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "25",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-25",
        "sibling-name",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "108-25-sibling-name-disambiguation-holden-hayden-v2": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 847,
      "burial_depth_tokens": 282876,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "25",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-25",
        "sibling-name",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "108-25-sibling-name-disambiguation-holden-hayden-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 2042,
      "burial_depth_tokens": 665694,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 3,
      "family": "25",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-25",
        "sibling-name",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "108-25-sibling-name-disambiguation-holden-hayden-v4": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 3812,
      "burial_depth_tokens": 1071032,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "high",
      "n_hops": 4,
      "n_memory_sites": 3,
      "family": "25",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-25",
        "sibling-name",
        "anticipability-high",
        "md-high",
        "n-hops-4",
        "compositional"
      ]
    },
    "108-46-math-only-service-scope-progressive-timeline-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 62,
      "burial_depth_tokens": 10545,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "46",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-46",
        "service-scope",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "108-46-math-only-service-scope-progressive-timeline-v1": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 62,
      "burial_depth_tokens": 10545,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "46",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-46",
        "service-scope",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "108-46-math-only-service-scope-progressive-timeline-v2": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 62,
      "burial_depth_tokens": 10545,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "46",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-46",
        "service-scope",
        "anticipability-high",
        "md-low",
        "n-hops-3",
        "compositional"
      ]
    },
    "108-47-ai-disclosure-to-teachers-v0": {
      "difficulty": "medium",
      "anticipability": 6,
      "burial_depth": 5095,
      "burial_depth_tokens": 1334360,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "47",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-47",
        "ai-disclosure",
        "anticipability-mid",
        "md-low",
        "n-hops-1"
      ]
    },
    "108-47-ai-disclosure-to-teachers-v1": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 5095,
      "burial_depth_tokens": 1334360,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "47",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-47",
        "ai-disclosure",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "108-47-ai-disclosure-to-teachers-v2": {
      "difficulty": "hard",
      "anticipability": 2,
      "burial_depth": 5095,
      "burial_depth_tokens": 1334360,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "47",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-47",
        "ai-disclosure",
        "anticipability-low",
        "md-mid",
        "n-hops-2"
      ]
    },
    "108-47-ai-disclosure-to-teachers-v3": {
      "difficulty": "hard",
      "anticipability": 3,
      "burial_depth": 5095,
      "burial_depth_tokens": 1334360,
      "trace_lines": 35392,
      "trace_tokens": 8745718,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "47",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-47",
        "ai-disclosure",
        "anticipability-low",
        "md-high",
        "n-hops-3"
      ]
    },
    "180-08-no-chrome-use-safari-v1": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 52130,
      "burial_depth_tokens": 28090354,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "08",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-08",
        "no-chrome",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "180-08-no-chrome-use-safari-v2": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 52130,
      "burial_depth_tokens": 28090354,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "08",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-08",
        "no-chrome",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "180-09-brother-nastori-recall-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 299,
      "burial_depth_tokens": 143221,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "09",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-09",
        "brother-nastori",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "180-09-brother-nastori-recall-v1": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 298,
      "burial_depth_tokens": 142405,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "09",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-09",
        "brother-nastori",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "180-09-brother-nastori-recall-v3": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 298,
      "burial_depth_tokens": 142405,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "09",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-09",
        "brother-nastori",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "180-10-parent-override-directive-v0": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 42212,
      "burial_depth_tokens": 22249017,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "10",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-10",
        "parent-override",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "synthetic-patch"
      ]
    },
    "180-11-joe-louis-specific-project-recall-v0": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 43267,
      "burial_depth_tokens": 22589343,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "11",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-11",
        "joe-louis",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "180-11-joe-louis-specific-project-recall-v1": {
      "difficulty": "hard",
      "anticipability": 6,
      "burial_depth": 43267,
      "burial_depth_tokens": 22589343,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "11",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-11",
        "joe-louis",
        "anticipability-mid",
        "md-low",
        "n-hops-2"
      ]
    },
    "180-11-joe-louis-specific-project-recall-v2": {
      "difficulty": "medium",
      "anticipability": 6,
      "burial_depth": 43267,
      "burial_depth_tokens": 22589343,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "11",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-11",
        "joe-louis",
        "anticipability-mid",
        "md-low",
        "n-hops-3"
      ]
    },
    "180-38-space-interest-not-animal-v0": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 32205,
      "burial_depth_tokens": 19169437,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "38",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-38",
        "space-interest",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "180-38-space-interest-not-animal-v1": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 32205,
      "burial_depth_tokens": 19169437,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "38",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-38",
        "space-interest",
        "anticipability-high",
        "md-mid",
        "n-hops-2",
        "constrained-selection"
      ]
    },
    "180-38-space-interest-not-animal-v2": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 32205,
      "burial_depth_tokens": 19169437,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "38",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-38",
        "space-interest",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "constrained-selection"
      ]
    },
    "180-38-space-interest-not-animal-v3": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 32205,
      "burial_depth_tokens": 19169437,
      "trace_lines": 63285,
      "trace_tokens": 36379971,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "38",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "compositional"
      ],
      "tags": [
        "family-38",
        "space-interest",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "synthetic-patch",
        "compositional"
      ]
    },
    "180-39-vietnamese-glosses-permission-v1": {
      "difficulty": "hard",
      "anticipability": 6,
      "burial_depth": 132,
      "burial_depth_tokens": 36101,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "39",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-39",
        "vietnamese-gloss",
        "anticipability-mid",
        "md-high",
        "n-hops-2"
      ]
    },
    "180-39-vietnamese-glosses-permission-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 132,
      "burial_depth_tokens": 36101,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "39",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-39",
        "vietnamese-gloss",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "180-41-vocab-batch-tracking-v0": {
      "difficulty": "medium",
      "anticipability": 7,
      "burial_depth": 54573,
      "burial_depth_tokens": 29755704,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "41",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-41",
        "vocab-batch",
        "anticipability-mid",
        "md-low",
        "n-hops-2"
      ]
    },
    "180-41-vocab-batch-tracking-v1": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 54628,
      "burial_depth_tokens": 29811531,
      "trace_lines": 63287,
      "trace_tokens": 36380022,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "41",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-41",
        "vocab-batch",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "synthetic-patch"
      ]
    },
    "180-41-vocab-batch-tracking-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 54573,
      "burial_depth_tokens": 29755704,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "41",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-41",
        "vocab-batch",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "180-41-vocab-batch-tracking-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 56276,
      "burial_depth_tokens": 31376269,
      "trace_lines": 63284,
      "trace_tokens": 36379843,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "41",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-41",
        "vocab-batch",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "197-48-weekly-subject-schedule-v0": {
      "difficulty": "easy",
      "anticipability": 8,
      "burial_depth": 9127,
      "burial_depth_tokens": 5659053,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "48",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-48",
        "weekly-schedule",
        "thursday-spanish",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "197-48-weekly-subject-schedule-v4": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 9127,
      "burial_depth_tokens": 5659053,
      "trace_lines": 116970,
      "trace_tokens": 31658402,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "48",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-48",
        "weekly-schedule",
        "one-off-vs-standing",
        "synthetic-patch",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "197-49-test-format-question-count-v0": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 36801,
      "burial_depth_tokens": 20178996,
      "trace_lines": 116970,
      "trace_tokens": 31658424,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "49",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-49",
        "amc8-format",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "197-49-test-format-question-count-v1": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 19661,
      "burial_depth_tokens": 11876803,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "49",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-49",
        "staar-math-format",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "197-49-test-format-question-count-v2": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 3702,
      "burial_depth_tokens": 2206745,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "49",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-49",
        "uil-extension",
        "compositional",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "197-49-test-format-question-count-v3": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 3702,
      "burial_depth_tokens": 2206745,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "49",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-49",
        "family-confusion",
        "wrong-confident-uncle",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "197-49-test-format-question-count-v4": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 36801,
      "burial_depth_tokens": 20178996,
      "trace_lines": 116970,
      "trace_tokens": 31658424,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "49",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-49",
        "amc8-format",
        "coach-pressure",
        "new-stakeholder",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "197-51-eighty-percent-word-problem-mix-v0": {
      "difficulty": "medium",
      "anticipability": 6,
      "burial_depth": 18312,
      "burial_depth_tokens": 10809993,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "51",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-51",
        "word-problem-mix",
        "anticipability-mid",
        "md-low",
        "n-hops-1"
      ]
    },
    "197-51-eighty-percent-word-problem-mix-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 18312,
      "burial_depth_tokens": 10809993,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "51",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-51",
        "word-problem-mix",
        "new-stakeholder",
        "co-tutor",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "197-51-eighty-percent-word-problem-mix-v4": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 18312,
      "burial_depth_tokens": 10809993,
      "trace_lines": 116968,
      "trace_tokens": 31658230,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "51",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-51",
        "family-confusion",
        "wrong-confident-grandmother",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "202-84-ela-report-card-link-recency-v1": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 2783,
      "burial_depth_tokens": 1195531,
      "trace_lines": 23857,
      "trace_tokens": 8195620,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "84",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-84",
        "report-card-recency",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "202-85-homework-song-titles-fidelity-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 14498,
      "burial_depth_tokens": 5592641,
      "trace_lines": 23858,
      "trace_tokens": 8195710,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "85",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-85",
        "song-titles-fidelity",
        "anticipability-high",
        "md-mid",
        "n-hops-1",
        "synthetic-patch"
      ]
    },
    "202-85-homework-song-titles-fidelity-v2": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 14498,
      "burial_depth_tokens": 5592641,
      "trace_lines": 23857,
      "trace_tokens": 8195620,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "85",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-85",
        "song-titles-fidelity",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "constrained-selection"
      ]
    },
    "214-30-original-scope-recall-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 77,
      "burial_depth_tokens": 17795,
      "trace_lines": 19001,
      "trace_tokens": 10164473,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "30",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-30",
        "original-scope",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "214-30-original-scope-recall-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 77,
      "burial_depth_tokens": 17795,
      "trace_lines": 19001,
      "trace_tokens": 10164473,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "30",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-30",
        "original-scope",
        "family-member-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "214-30-original-scope-recall-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 77,
      "burial_depth_tokens": 17795,
      "trace_lines": 19001,
      "trace_tokens": 10164473,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "30",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-30",
        "original-scope",
        "compositional",
        "school-counselor",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "214-97-operator-pause-until-paid-upgrade-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 2007,
      "burial_depth_tokens": 1989828,
      "trace_lines": 19001,
      "trace_tokens": 10164473,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "97",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-97",
        "operator-directive",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "214-97-operator-pause-until-paid-upgrade-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 2010,
      "burial_depth_tokens": 1991189,
      "trace_lines": 19001,
      "trace_tokens": 10164473,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "97",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-97",
        "operator-directive",
        "wrong-confident-parent",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "216-22-wednesday-extended-slot-progressive-v2": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 425,
      "burial_depth_tokens": 153680,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "22",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-22",
        "wed-extended-slot",
        "compositional",
        "audit",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "216-22-wednesday-extended-slot-progressive-v3": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 8901,
      "burial_depth_tokens": 4877683,
      "trace_lines": 23249,
      "trace_tokens": 7519031,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "22",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-22",
        "wed-extended-slot",
        "synthetic-patch",
        "latest-state",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "216-22-wednesday-extended-slot-progressive-v4": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 8901,
      "burial_depth_tokens": 4877683,
      "trace_lines": 23249,
      "trace_tokens": 7519031,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "22",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "family-confusion",
        "wrong-confident"
      ],
      "tags": [
        "family-22",
        "wed-extended-slot",
        "synthetic-patch",
        "family-confusion",
        "wrong-confident",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "216-23-45-min-session-length-commitment-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 425,
      "burial_depth_tokens": 153680,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "23",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "session-length"
      ],
      "tags": [
        "family-23",
        "session-length",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "216-23-45-min-session-length-commitment-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 425,
      "burial_depth_tokens": 153680,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "23",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "session-length",
        "wrong-confident"
      ],
      "tags": [
        "family-23",
        "session-length",
        "wrong-confident",
        "trace-failure-mode",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "216-23-45-min-session-length-commitment-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 425,
      "burial_depth_tokens": 153680,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "23",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "session-length",
        "new-stakeholder"
      ],
      "tags": [
        "family-23",
        "session-length",
        "new-stakeholder",
        "billing-audit",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "216-23-45-min-session-length-commitment-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 425,
      "burial_depth_tokens": 153680,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "23",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "session-length",
        "constrained-selection"
      ],
      "tags": [
        "family-23",
        "session-length",
        "constrained-selection",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "216-23-45-min-session-length-commitment-v4": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 423,
      "burial_depth_tokens": 152327,
      "trace_lines": 23247,
      "trace_tokens": 7518865,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "23",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "session-length",
        "family-confusion",
        "compositional",
        "wrong-confident"
      ],
      "tags": [
        "family-23",
        "session-length",
        "family-confusion",
        "compositional",
        "wrong-confident",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "219-73-juliana-is-the-parent-adult-learner-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 48,
      "burial_depth_tokens": 10502,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "73",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-73",
        "juliana-adult-learner",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "219-73-juliana-is-the-parent-adult-learner-v1": {
      "difficulty": "medium",
      "anticipability": 2,
      "burial_depth": 48,
      "burial_depth_tokens": 10502,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "73",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "wrong-confident"
      ],
      "tags": [
        "family-73",
        "juliana-adult-learner",
        "anticipability-low",
        "md-high",
        "n-hops-1",
        "wrong-confident"
      ]
    },
    "219-73-juliana-is-the-parent-adult-learner-v2": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 48,
      "burial_depth_tokens": 10502,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "73",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-73",
        "juliana-adult-learner",
        "family-member-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "219-76-department-of-war-not-defense-v3": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 20304,
      "burial_depth_tokens": 17871515,
      "trace_lines": 24539,
      "trace_tokens": 38797717,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "76",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-76",
        "department-of-war",
        "synthetic-patch-nuance",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "219-86-lecun-feifei-researcher-pair-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 16637,
      "burial_depth_tokens": 10255466,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "86",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-86",
        "researcher-pair",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "219-86-lecun-feifei-researcher-pair-v2": {
      "difficulty": "easy",
      "anticipability": 8,
      "burial_depth": 16637,
      "burial_depth_tokens": 10255466,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "86",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-86",
        "researcher-pair",
        "new-stakeholder",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "219-87-gavin-logout-was-parent-device-switch-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 24476,
      "burial_depth_tokens": 38774104,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "87",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-87",
        "gavin-logout",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "219-89-earth-day-totoro-spec-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 24232,
      "burial_depth_tokens": 38585427,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "89",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-89",
        "earth-day-totoro",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "219-89-earth-day-totoro-spec-v1": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 24232,
      "burial_depth_tokens": 38585427,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "89",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-89",
        "earth-day-totoro",
        "constrained-selection",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "219-89-earth-day-totoro-spec-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 24232,
      "burial_depth_tokens": 38585427,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "89",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-89",
        "earth-day-totoro",
        "wrong-confident-parent",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "219-89-earth-day-totoro-spec-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 24232,
      "burial_depth_tokens": 38585427,
      "trace_lines": 24538,
      "trace_tokens": 38797593,
      "misdirection": "mid",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "89",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-89",
        "earth-day-totoro",
        "compositional",
        "curriculum-tie",
        "anticipability-high",
        "md-mid",
        "n-hops-3"
      ]
    },
    "268-69-aditi-30-minute-sessions-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 8069,
      "burial_depth_tokens": 3886024,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "69",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "session-length"
      ],
      "tags": [
        "family-69",
        "session-length",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "268-69-aditi-30-minute-sessions-v2": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 8069,
      "burial_depth_tokens": 3886024,
      "trace_lines": 17138,
      "trace_tokens": 41034203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "69",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "session-length",
        "family-confusion"
      ],
      "tags": [
        "family-69",
        "session-length",
        "family-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "268-72-pia-traveling-overseas-india-v2": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 13411,
      "burial_depth_tokens": 6653033,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "72",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-72",
        "overseas-channel",
        "wrong-stakeholder",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "268-72-pia-traveling-overseas-india-v3": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 13411,
      "burial_depth_tokens": 6653033,
      "trace_lines": 17138,
      "trace_tokens": 41034226,
      "misdirection": "mid",
      "n_hops": 3,
      "n_memory_sites": 3,
      "family": "72",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-72",
        "overseas-channel",
        "return-date",
        "synthetic-patch",
        "anticipability-high",
        "md-mid",
        "n-hops-3"
      ]
    },
    "268-91-module-6-two-step-equations-wednesday-test-v0": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 11865,
      "burial_depth_tokens": 5924553,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "91",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-91",
        "module-6",
        "two-step-equations",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "268-91-module-6-two-step-equations-wednesday-test-v1": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 11141,
      "burial_depth_tokens": 5495161,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "91",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-91",
        "module-6",
        "two-step-equations",
        "new-stakeholder",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "268-91-module-6-two-step-equations-wednesday-test-v2": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 11865,
      "burial_depth_tokens": 5924553,
      "trace_lines": 17138,
      "trace_tokens": 41034210,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "91",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-91",
        "module-6",
        "two-step-equations",
        "family-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "268-92-amc8-test-date-jan-25-2026-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 494,
      "burial_depth_tokens": 188299,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "92",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-92",
        "amc8-date",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "268-92-amc8-test-date-jan-25-2026-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 494,
      "burial_depth_tokens": 188299,
      "trace_lines": 17137,
      "trace_tokens": 41034119,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "92",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-92",
        "amc8-date",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "268-92-amc8-test-date-jan-25-2026-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 5001,
      "burial_depth_tokens": 2367914,
      "trace_lines": 17138,
      "trace_tokens": 41034235,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "92",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-92",
        "amc8-date",
        "compositional",
        "parent-chosen-date",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "268-92-amc8-test-date-jan-25-2026-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 494,
      "burial_depth_tokens": 188299,
      "trace_lines": 17138,
      "trace_tokens": 41034226,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "92",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-92",
        "amc8-date",
        "family-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "294-52-chloe-regular-slot-mwf-430-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 12099,
      "burial_depth_tokens": 6336719,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "52",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-52",
        "chloe-schedule",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "294-52-chloe-regular-slot-mwf-430-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 12099,
      "burial_depth_tokens": 6336719,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "52",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-52",
        "chloe-schedule",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "294-52-chloe-regular-slot-mwf-430-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 12099,
      "burial_depth_tokens": 6336719,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "52",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-52",
        "chloe-schedule",
        "wrong-confident-parent",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "294-52-chloe-regular-slot-mwf-430-v3": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 4844,
      "burial_depth_tokens": 2065583,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "52",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-52",
        "chloe-schedule",
        "compositional",
        "both-kids",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "294-52-chloe-regular-slot-mwf-430-v4": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 12099,
      "burial_depth_tokens": 6336719,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "52",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-52",
        "chloe-schedule",
        "family-confusion",
        "wrong-confident-relative",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "294-53-carmindy-precal-not-trig-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 7979,
      "burial_depth_tokens": 3760618,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "53",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-53",
        "carmindy-precal",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "294-53-carmindy-precal-not-trig-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 7979,
      "burial_depth_tokens": 3760618,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "53",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-53",
        "carmindy-precal",
        "new-stakeholder",
        "email",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "294-53-carmindy-precal-not-trig-v2": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 7979,
      "burial_depth_tokens": 3760618,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "53",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-53",
        "carmindy-precal",
        "constrained-selection",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "294-53-carmindy-precal-not-trig-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 7979,
      "burial_depth_tokens": 3760618,
      "trace_lines": 27757,
      "trace_tokens": 10488179,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "53",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "family-confusion"
      ],
      "tags": [
        "family-53",
        "carmindy-precal",
        "synthetic-patch",
        "wrong-confident-relative",
        "family-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "294-54-williams-referral-code-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 9,
      "burial_depth_tokens": 1064,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "54",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-54",
        "referral-code",
        "opaque-token",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "294-54-williams-referral-code-v1": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 9,
      "burial_depth_tokens": 1064,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "54",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-54",
        "referral-code",
        "new-stakeholder",
        "opaque-token",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "294-54-williams-referral-code-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 9,
      "burial_depth_tokens": 1064,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "54",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-54",
        "referral-code",
        "wrong-confident-audit",
        "email",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "294-80-carmindy-tue-thu-345-415-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 4844,
      "burial_depth_tokens": 2065583,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "80",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-80",
        "carmindy-schedule",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "294-80-carmindy-tue-thu-345-415-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 4844,
      "burial_depth_tokens": 2065583,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "80",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-80",
        "carmindy-schedule",
        "new-stakeholder",
        "email",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "294-80-carmindy-tue-thu-345-415-v2": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 27757,
      "burial_depth_tokens": 10488075,
      "trace_lines": 27757,
      "trace_tokens": 10488178,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "80",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-80",
        "carmindy-schedule",
        "synthetic-patch",
        "patched-state",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "294-80-carmindy-tue-thu-345-415-v3": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 4844,
      "burial_depth_tokens": 2065583,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "80",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-80",
        "carmindy-schedule",
        "sister-confusion",
        "wrong-confident-relative",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "294-80-carmindy-tue-thu-345-415-v4": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 4844,
      "burial_depth_tokens": 2065583,
      "trace_lines": 27756,
      "trace_tokens": 10488074,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "80",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-80",
        "carmindy-schedule",
        "compositional",
        "both-kids",
        "operator-audit",
        "email",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "304-12-test-mode-directive-recall-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 27781,
      "burial_depth_tokens": 16381351,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "12",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-12",
        "test-mode",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "304-12-test-mode-directive-recall-v1": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 27762,
      "burial_depth_tokens": 16373684,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "12",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-12",
        "test-mode",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "304-12-test-mode-directive-recall-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 27762,
      "burial_depth_tokens": 16373684,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "12",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-12",
        "test-mode",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "constrained-selection"
      ]
    },
    "304-12-test-mode-directive-recall-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 27762,
      "burial_depth_tokens": 16373684,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "12",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-12",
        "test-mode",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "compositional"
      ]
    },
    "304-13-stale-schedule-vs-actual-pattern-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 12223,
      "burial_depth_tokens": 7753937,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 3,
      "family": "13",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-13",
        "stale-schedule",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "304-13-stale-schedule-vs-actual-pattern-v3": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 40572,
      "burial_depth_tokens": 28638070,
      "trace_lines": 40574,
      "trace_tokens": 28638300,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "13",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-13",
        "stale-schedule",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "latest-wins",
        "synthetic-patch"
      ]
    },
    "304-14-numerator-denominator-taxonomy-v0": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 12001,
      "burial_depth_tokens": 7608872,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "14",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-14",
        "error-taxonomy",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "304-14-numerator-denominator-taxonomy-v2": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 11283,
      "burial_depth_tokens": 7244161,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "14",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-14",
        "error-taxonomy",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "304-15-shadow-compass-remediation-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 37262,
      "burial_depth_tokens": 25306606,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "15",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-15",
        "shadow-compass",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "304-15-shadow-compass-remediation-v1": {
      "difficulty": "easy",
      "anticipability": 6,
      "burial_depth": 37262,
      "burial_depth_tokens": 25306606,
      "trace_lines": 40571,
      "trace_tokens": 28638069,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "15",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "wrong-confident"
      ],
      "tags": [
        "family-15",
        "shadow-compass",
        "anticipability-mid",
        "md-mid",
        "n-hops-2",
        "wrong-confident"
      ]
    },
    "350-34-mon-thu-5pm-schedule-correction-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 11828,
      "burial_depth_tokens": 4281252,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "34",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-34",
        "schedule-correction",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "350-34-mon-thu-5pm-schedule-correction-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 11828,
      "burial_depth_tokens": 4281252,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "34",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-34",
        "schedule-correction",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "350-34-mon-thu-5pm-schedule-correction-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 11828,
      "burial_depth_tokens": 4281252,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "34",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-34",
        "schedule-correction",
        "family-member-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 7477,
      "burial_depth_tokens": 3357547,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "94",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-94",
        "teacher-email",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 7477,
      "burial_depth_tokens": 3357547,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "94",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-94",
        "teacher-email",
        "email-compose",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 7459,
      "burial_depth_tokens": 3354183,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "94",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-94",
        "teacher-email",
        "family-member-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "350-95-karter-fractions-test-score-84-v0": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 8462,
      "burial_depth_tokens": 3554074,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "95",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-95",
        "test-score-84",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "350-95-karter-fractions-test-score-84-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 8462,
      "burial_depth_tokens": 3554074,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "95",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-95",
        "test-score-84",
        "distractor-stress",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "350-96-parent-name-mrs-marsha-suggs-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 6484,
      "burial_depth_tokens": 3165270,
      "trace_lines": 16439,
      "trace_tokens": 5540963,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "96",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-96",
        "parent-name",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "367-61-teaching-textbooks-pre-algebra-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 5411,
      "burial_depth_tokens": 2226292,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "61",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-61",
        "teaching-textbooks",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "publisher-detail",
        "new-stakeholder"
      ]
    },
    "367-61-teaching-textbooks-pre-algebra-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 5411,
      "burial_depth_tokens": 2226292,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "61",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-61",
        "teaching-textbooks",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "family-confusion",
        "mirroring-pressure"
      ]
    },
    "367-62-mon-10-tue-fri-11-schedule-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 6275,
      "burial_depth_tokens": 2379918,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "62",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-62",
        "schedule",
        "anticipability-high",
        "md-mid",
        "n-hops-1",
        "day-dependent-recall"
      ]
    },
    "367-62-mon-10-tue-fri-11-schedule-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 5371,
      "burial_depth_tokens": 2210616,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "62",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional",
        "new-stakeholder"
      ],
      "tags": [
        "family-62",
        "schedule",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "compositional",
        "full-timeline",
        "new-stakeholder"
      ]
    },
    "367-63-subscription-paused-march-7-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 16414,
      "burial_depth_tokens": 4451526,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "63",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-63",
        "subscription-paused",
        "anticipability-high",
        "md-mid",
        "n-hops-1",
        "date-recall"
      ]
    },
    "367-63-subscription-paused-march-7-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 16414,
      "burial_depth_tokens": 4451526,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "63",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-63",
        "subscription-paused",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "new-stakeholder",
        "billing-ops"
      ]
    },
    "367-64-riley-curriculum-mastery-level-v1": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 11864,
      "burial_depth_tokens": 3488418,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "64",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "family-confusion"
      ],
      "tags": [
        "family-64",
        "curriculum-mastery",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "family-confusion",
        "mirroring-pressure"
      ]
    },
    "367-64-riley-curriculum-mastery-level-v2": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 5604,
      "burial_depth_tokens": 2265167,
      "trace_lines": 17275,
      "trace_tokens": 4602148,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 3,
      "family": "64",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional",
        "new-stakeholder"
      ],
      "tags": [
        "family-64",
        "curriculum-mastery",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "compositional",
        "multi-topic",
        "new-stakeholder"
      ]
    },
    "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 24019,
      "burial_depth_tokens": 6920442,
      "trace_lines": 33227,
      "trace_tokens": 8708693,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-55b",
        "benaiah-formal-name",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "699-56-nephew-add-to-existing-account-bryan-override-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 30501,
      "burial_depth_tokens": 8392659,
      "trace_lines": 33226,
      "trace_tokens": 8708595,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "56",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-56",
        "nephew-bryan-override",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "699-56-nephew-add-to-existing-account-bryan-override-v1": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 30501,
      "burial_depth_tokens": 8392659,
      "trace_lines": 33226,
      "trace_tokens": 8708595,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "56",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-56",
        "nephew-bryan-override",
        "no-referral-fee",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "699-56-nephew-add-to-existing-account-bryan-override-v3": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 30501,
      "burial_depth_tokens": 8392659,
      "trace_lines": 33228,
      "trace_tokens": 8708743,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "56",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-56",
        "nephew-bryan-override",
        "nuance-patch",
        "compositional-split",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "699-78-parent-is-guardian-not-biological-mother-v3": {
      "difficulty": "hard",
      "anticipability": 2,
      "burial_depth": 27010,
      "burial_depth_tokens": 7898944,
      "trace_lines": 33226,
      "trace_tokens": 8708595,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "78",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-78",
        "guardian-not-mother",
        "constrained-selection",
        "profile-update",
        "anticipability-low",
        "md-high",
        "n-hops-2"
      ]
    },
    "719-32-standing-630-pm-schedule-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 21,
      "burial_depth_tokens": 2460,
      "trace_lines": 27817,
      "trace_tokens": 4023195,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "32",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-32",
        "standing-schedule",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "719-32-standing-630-pm-schedule-v1": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 4197,
      "burial_depth_tokens": 641770,
      "trace_lines": 27817,
      "trace_tokens": 4023195,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "32",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-32",
        "standing-schedule",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "719-32-standing-630-pm-schedule-v2": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 209,
      "burial_depth_tokens": 35949,
      "trace_lines": 27817,
      "trace_tokens": 4023195,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "32",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-32",
        "standing-schedule",
        "constrained-menu",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "719-32-standing-630-pm-schedule-v3": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 27819,
      "burial_depth_tokens": 4023295,
      "trace_lines": 27819,
      "trace_tokens": 4023380,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "32",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "new-stakeholder"
      ],
      "tags": [
        "family-32",
        "standing-schedule",
        "synthetic-patch",
        "new-stakeholder",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "719-33-test-rescheduled-to-monday-v0": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 16085,
      "burial_depth_tokens": 2482943,
      "trace_lines": 27817,
      "trace_tokens": 4023195,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "33",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-33",
        "test-rescheduled",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "719-33-test-rescheduled-to-monday-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 27818,
      "burial_depth_tokens": 4023196,
      "trace_lines": 27819,
      "trace_tokens": 4023352,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "33",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "compositional"
      ],
      "tags": [
        "family-33",
        "test-rescheduled",
        "synthetic-patch",
        "compositional",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "732-36-wednesday-5pm-youth-group-override-732-v0": {
      "difficulty": "easy",
      "anticipability": 8,
      "burial_depth": 12198,
      "burial_depth_tokens": 2626529,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "36",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-36",
        "wed-youth-override",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "732-36-wednesday-5pm-youth-group-override-732-v1": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 12198,
      "burial_depth_tokens": 2626529,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "36",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-36",
        "wed-youth-override",
        "new-stakeholder",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "732-36-wednesday-5pm-youth-group-override-732-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 12198,
      "burial_depth_tokens": 2626529,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "36",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-36",
        "wed-youth-override",
        "multiple-choice",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "732-36-wednesday-5pm-youth-group-override-732-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 12198,
      "burial_depth_tokens": 2626529,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "36",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-36",
        "wed-youth-override",
        "wrong-confident-interlocutor",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "732-93-tue-thu-reading-30-writing-20-split-v0": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 1140,
      "burial_depth_tokens": 209513,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "93",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-93",
        "tue-thu-split",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "732-93-tue-thu-reading-30-writing-20-split-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 1140,
      "burial_depth_tokens": 209513,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "93",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-93",
        "tue-thu-split",
        "new-stakeholder",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "732-93-tue-thu-reading-30-writing-20-split-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 1140,
      "burial_depth_tokens": 209513,
      "trace_lines": 23119,
      "trace_tokens": 4222634,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "93",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-93",
        "tue-thu-split",
        "wrong-confident-interlocutor",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "732-93-tue-thu-reading-30-writing-20-split-v4": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 23120,
      "burial_depth_tokens": 4222635,
      "trace_lines": 23120,
      "trace_tokens": 4222751,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "93",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch",
        "new-stakeholder"
      ],
      "tags": [
        "family-93",
        "tue-thu-split",
        "synthetic-patch",
        "new-stakeholder",
        "priority-flip",
        "anticipability-high",
        "md-high",
        "n-hops-3"
      ]
    },
    "745-57-last-kids-on-earth-book-series-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 1181,
      "burial_depth_tokens": 182235,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "57",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-57",
        "last-kids-on-earth",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-57-last-kids-on-earth-book-series-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1181,
      "burial_depth_tokens": 182235,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "57",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-57",
        "last-kids-on-earth",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-57-last-kids-on-earth-book-series-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 1181,
      "burial_depth_tokens": 182235,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "57",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-57",
        "last-kids-on-earth",
        "compositional",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "745-58-business-name-mini-moments-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 1224,
      "burial_depth_tokens": 188640,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "58",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-58",
        "mini-moments",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-58-business-name-mini-moments-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1224,
      "burial_depth_tokens": 188640,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "58",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "wrong-confident"
      ],
      "tags": [
        "family-58",
        "mini-moments",
        "wrong-confident",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "745-59-sessions-mix-in-other-subjects-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 1404,
      "burial_depth_tokens": 274496,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "59",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-59",
        "mix-other-subjects",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-60-douglas-homework-1-to-15-and-28-29-v0": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 6585,
      "burial_depth_tokens": 1252989,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "60",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-60",
        "homework-1-15-28-29",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-60-douglas-homework-1-to-15-and-28-29-v2": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 6585,
      "burial_depth_tokens": 1252989,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "60",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "wrong-confident",
        "family-confusion"
      ],
      "tags": [
        "family-60",
        "homework-1-15-28-29",
        "wrong-confident",
        "family-confusion",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "745-60-douglas-homework-1-to-15-and-28-29-v3": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 6585,
      "burial_depth_tokens": 1252989,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "60",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder",
        "compositional"
      ],
      "tags": [
        "family-60",
        "homework-1-15-28-29",
        "new-stakeholder",
        "compositional",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "745-81-behavior-reporting-to-therapist-v0": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 9188,
      "burial_depth_tokens": 1886447,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "81",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-81",
        "therapist-channel",
        "quote-back",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-81-behavior-reporting-to-therapist-v1": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 9188,
      "burial_depth_tokens": 1886447,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "81",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-81",
        "therapist-channel",
        "new-stakeholder",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "745-82-doug-tired-claim-is-avoidance-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 8061,
      "burial_depth_tokens": 1575783,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "82",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-82",
        "doug-behavior-patterns",
        "new-stakeholder",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "745-82-doug-tired-claim-is-avoidance-v4": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 8061,
      "burial_depth_tokens": 1575783,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": "82",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-82",
        "doug-behavior-patterns",
        "compositional",
        "therapist-channel",
        "anticipability-high",
        "md-low",
        "n-hops-2"
      ]
    },
    "745-82-doug-tired-claim-is-avoidance-v5": {
      "difficulty": "easy",
      "anticipability": 6,
      "burial_depth": 2400,
      "burial_depth_tokens": 437690,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "82",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-82",
        "doug-behavior-patterns",
        "self-application",
        "anticipability-mid",
        "md-mid",
        "n-hops-2"
      ]
    },
    "745-83-no-repitch-human-tutor-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 9579,
      "burial_depth_tokens": 2025463,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "83",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-83",
        "no-repitch",
        "quote-back",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "745-83-no-repitch-human-tutor-v1": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 9610,
      "burial_depth_tokens": 2032486,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "83",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-83",
        "no-repitch",
        "wrong-confident-teammate",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "745-83-no-repitch-human-tutor-v4": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 9589,
      "burial_depth_tokens": 2027212,
      "trace_lines": 28386,
      "trace_tokens": 9959976,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "83",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-83",
        "no-repitch",
        "bryan-fresh-ask",
        "hold-line",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "804-27-referral-link-cantave-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1017,
      "burial_depth_tokens": 171033,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "27",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-27",
        "referral-link",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "804-27-referral-link-cantave-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1017,
      "burial_depth_tokens": 171033,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "27",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-27",
        "referral-link",
        "anticipability-high",
        "md-mid",
        "n-hops-2",
        "new-stakeholder"
      ]
    },
    "804-27-referral-link-cantave-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1017,
      "burial_depth_tokens": 171033,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "27",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-27",
        "referral-link",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "new-stakeholder",
        "audit-framing"
      ]
    },
    "804-27-referral-link-cantave-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1017,
      "burial_depth_tokens": 171033,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "27",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-27",
        "referral-link",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "constrained-selection",
        "confusables"
      ]
    },
    "804-27-referral-link-cantave-v4": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 32394,
      "burial_depth_tokens": 7066551,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 1,
      "family": "27",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-27",
        "referral-link",
        "anticipability-high",
        "md-high",
        "n-hops-3",
        "wrong-confident-interlocutor"
      ]
    },
    "804-28-parent-email-icloud-recall-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1224,
      "burial_depth_tokens": 216803,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "28",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-28",
        "parent-email",
        "anticipability-high",
        "md-mid",
        "n-hops-1",
        "force-email-send"
      ]
    },
    "804-28-parent-email-icloud-recall-v1": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1224,
      "burial_depth_tokens": 216803,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "28",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-28",
        "parent-email",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "compositional"
      ]
    },
    "804-28-parent-email-icloud-recall-v2": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1218,
      "burial_depth_tokens": 215329,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "28",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-28",
        "parent-email",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "new-stakeholder",
        "audit-framing"
      ]
    },
    "804-28-parent-email-icloud-recall-v3": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1218,
      "burial_depth_tokens": 215329,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "28",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "constrained-selection"
      ],
      "tags": [
        "family-28",
        "parent-email",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "constrained-selection"
      ]
    },
    "804-28-parent-email-icloud-recall-v4": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 1218,
      "burial_depth_tokens": 215329,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "28",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-28",
        "parent-email",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "wrong-confident-interlocutor"
      ]
    },
    "804-42-cj-pronouns-he-him-v2": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 16644,
      "burial_depth_tokens": 4675478,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "42",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-42",
        "cj-pronouns",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "about-cj",
        "new-stakeholder",
        "pronoun-pressure"
      ]
    },
    "804-43-cj-christina-twin-disambiguation-v3": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 15740,
      "burial_depth_tokens": 4415858,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 2,
      "family": "43",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-43",
        "twin-disambiguation",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "misspelling-routing"
      ]
    },
    "804-43-cj-christina-twin-disambiguation-v4": {
      "difficulty": "medium",
      "anticipability": 7,
      "burial_depth": 4634,
      "burial_depth_tokens": 1217130,
      "trace_lines": 32407,
      "trace_tokens": 7070203,
      "misdirection": "high",
      "n_hops": 3,
      "n_memory_sites": 2,
      "family": "43",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "compositional"
      ],
      "tags": [
        "family-43",
        "twin-disambiguation",
        "anticipability-mid",
        "md-high",
        "n-hops-3",
        "compositional",
        "wrong-confident-interlocutor",
        "family-roster"
      ]
    },
    "857-66-rome-project-what-romans-ate-v0": {
      "difficulty": "easy",
      "anticipability": 9,
      "burial_depth": 10580,
      "burial_depth_tokens": 1669983,
      "trace_lines": 11858,
      "trace_tokens": 1934564,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "66",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-66",
        "rome-project",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "857-67-parent-name-sabrina-lebron-v0": {
      "difficulty": "easy",
      "anticipability": 10,
      "burial_depth": 10843,
      "burial_depth_tokens": 1699168,
      "trace_lines": 11858,
      "trace_tokens": 1934564,
      "misdirection": "low",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "67",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-67",
        "parent-name",
        "anticipability-high",
        "md-low",
        "n-hops-1"
      ]
    },
    "857-68-move-on-from-fraction-addition-v0": {
      "difficulty": "hard",
      "anticipability": 6,
      "burial_depth": 3925,
      "burial_depth_tokens": 656541,
      "trace_lines": 11858,
      "trace_tokens": 1934564,
      "misdirection": "low",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "68",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-68",
        "student-preference",
        "anticipability-mid",
        "md-low",
        "n-hops-2"
      ]
    },
    "945-07a-use-abby-when-writing-TO-her-v0": {
      "difficulty": "medium",
      "anticipability": 9,
      "burial_depth": 610,
      "burial_depth_tokens": 149629,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-07a",
        "abby-name-to",
        "anticipability-high",
        "md-high",
        "n-hops-1"
      ]
    },
    "945-07a-use-abby-when-writing-TO-her-v1": {
      "difficulty": "medium",
      "anticipability": 6,
      "burial_depth": 610,
      "burial_depth_tokens": 149629,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-07a",
        "abby-name-to",
        "anticipability-mid",
        "md-high",
        "n-hops-1"
      ]
    },
    "945-07a-use-abby-when-writing-TO-her-v2": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 610,
      "burial_depth_tokens": 149629,
      "trace_lines": 11631,
      "trace_tokens": 3746109,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-07a",
        "abby-name-to",
        "anticipability-high",
        "md-high",
        "n-hops-2"
      ]
    },
    "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1": {
      "difficulty": "medium",
      "anticipability": 6,
      "burial_depth": 610,
      "burial_depth_tokens": 149629,
      "trace_lines": 11631,
      "trace_tokens": 3746012,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 2,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-07b",
        "abby-name-about",
        "anticipability-mid",
        "md-high",
        "n-hops-2"
      ]
    },
    "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 2666,
      "burial_depth_tokens": 703140,
      "trace_lines": 11631,
      "trace_tokens": 3746012,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 3,
      "family": null,
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [],
      "tags": [
        "family-07b",
        "abby-name-about",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "trap"
      ]
    },
    "945-44-subject-exclusion-foreign-language-v0": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 15,
      "burial_depth_tokens": 2884,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "44",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-44",
        "foreign-lang-exclusion",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "945-44-subject-exclusion-foreign-language-v1": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 15,
      "burial_depth_tokens": 2884,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "44",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-44",
        "foreign-lang-exclusion",
        "anticipability-high",
        "md-high",
        "n-hops-1",
        "concealed"
      ]
    },
    "945-44-subject-exclusion-foreign-language-v2": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 15,
      "burial_depth_tokens": 2884,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "44",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-44",
        "foreign-lang-exclusion",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "labeled-worksheet"
      ]
    },
    "945-44-subject-exclusion-foreign-language-v3": {
      "difficulty": "hard",
      "anticipability": 8,
      "burial_depth": 15,
      "burial_depth_tokens": 2884,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "44",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-44",
        "foreign-lang-exclusion",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "unlabeled"
      ]
    },
    "945-45-specific-named-speech-goals-v0": {
      "difficulty": "medium",
      "anticipability": 8,
      "burial_depth": 2666,
      "burial_depth_tokens": 703140,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "45",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-45",
        "speech-goal-problem-size",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "945-45-specific-named-speech-goals-v1": {
      "difficulty": "medium",
      "anticipability": 10,
      "burial_depth": 2667,
      "burial_depth_tokens": 703739,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "mid",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "45",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-45",
        "speech-goal-7-word-sentences",
        "anticipability-high",
        "md-mid",
        "n-hops-2"
      ]
    },
    "945-98-grandfathered-pricing-with-cascading-patches-v0": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 11631,
      "burial_depth_tokens": 3745936,
      "trace_lines": 11631,
      "trace_tokens": 3746053,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "98",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-98",
        "grandfathered-pricing",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "synthetic-patch"
      ]
    },
    "945-98-grandfathered-pricing-with-cascading-patches-v1": {
      "difficulty": "hard",
      "anticipability": 9,
      "burial_depth": 11632,
      "burial_depth_tokens": 3746054,
      "trace_lines": 11632,
      "trace_tokens": 3746177,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "98",
      "category": "long-horizon-memory",
      "adversarial": true,
      "flags": [
        "synthetic-patch"
      ],
      "tags": [
        "family-98",
        "grandfathered-pricing",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "synthetic-patch",
        "two-patches"
      ]
    },
    "945-99-session-subject-4-item-closed-scope-v0": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 2660,
      "burial_depth_tokens": 700500,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "mid",
      "n_hops": 1,
      "n_memory_sites": 1,
      "family": "99",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-99",
        "closed-scope-4-items",
        "anticipability-high",
        "md-mid",
        "n-hops-1"
      ]
    },
    "945-99-session-subject-4-item-closed-scope-v1": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 2599,
      "burial_depth_tokens": 669128,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "99",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [
        "new-stakeholder"
      ],
      "tags": [
        "family-99",
        "closed-scope-4-items",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "new-stakeholder"
      ]
    },
    "945-99-session-subject-4-item-closed-scope-v2": {
      "difficulty": "hard",
      "anticipability": 10,
      "burial_depth": 2660,
      "burial_depth_tokens": 700500,
      "trace_lines": 11630,
      "trace_tokens": 3745935,
      "misdirection": "high",
      "n_hops": 2,
      "n_memory_sites": 1,
      "family": "99",
      "category": "long-horizon-memory",
      "adversarial": false,
      "flags": [],
      "tags": [
        "family-99",
        "closed-scope-4-items",
        "anticipability-high",
        "md-high",
        "n-hops-2",
        "coordinating-teacher"
      ]
    }
  },
  "runs": [
    {
      "runKey": "rlm-opus-4.8",
      "harness": "trace-rlm",
      "model": "claude-opus-4.8",
      "modelName": "claude-opus-4.8",
      "reported": {
        "cost": 0.785,
        "tokens": 376000,
        "time": 212,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": true,
          "cost": 0.4764,
          "tokens": 349557,
          "time": 204.4
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": true,
          "cost": 3.6634,
          "tokens": 969968,
          "time": 278.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 0.2358,
          "tokens": 111415,
          "time": 147.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": true,
          "cost": 0.2186,
          "tokens": 106799,
          "time": 122.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 0.5263,
          "tokens": 336213,
          "time": 259.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.3502,
          "tokens": 254581,
          "time": 223.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.9474,
          "tokens": 772479,
          "time": 388.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.7367,
          "tokens": 218977,
          "time": 121.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.5644,
          "tokens": 422577,
          "time": 266.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.2431,
          "tokens": 147164,
          "time": 138.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.4412,
          "tokens": 322190,
          "time": 174.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.447,
          "tokens": 287338,
          "time": 208.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.6993,
          "tokens": 454407,
          "time": 324.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 3.9441,
          "tokens": 712789,
          "time": 741.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.5646,
          "tokens": 428783,
          "time": 238.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 0.4434,
          "tokens": 350405,
          "time": 209.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": true,
          "cost": 1.2785,
          "tokens": 318606,
          "time": 174.8
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.205,
          "tokens": 112547,
          "time": 100.3
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.7511,
          "tokens": 581028,
          "time": 375.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 4.8908,
          "tokens": 1813617,
          "time": 422.2
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.2622,
          "tokens": 142301,
          "time": 170.3
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.6252,
          "tokens": 545854,
          "time": 261.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.5025,
          "tokens": 347311,
          "time": 216.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.2782,
          "tokens": 175422,
          "time": 200.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 1.0359,
          "tokens": 1004111,
          "time": 402.8
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.6128,
          "tokens": 1143538,
          "time": 452.0
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 1.252,
          "tokens": 556392,
          "time": 344.9
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.0475,
          "tokens": 388574,
          "time": 303.6
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 1.3083,
          "tokens": 1074772,
          "time": 361.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 1.9706,
          "tokens": 514400,
          "time": 271.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.4988,
          "tokens": 376677,
          "time": 261.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.5703,
          "tokens": 295528,
          "time": 222.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.9831,
          "tokens": 913978,
          "time": 366.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 0.4126,
          "tokens": 274794,
          "time": 227.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.418,
          "tokens": 303896,
          "time": 240.7
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.2571,
          "tokens": 149280,
          "time": 184.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.4172,
          "tokens": 279349,
          "time": 233.6
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 3.8678,
          "tokens": 1048739,
          "time": 283.9
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 2.2505,
          "tokens": 630977,
          "time": 373.6
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.5581,
          "tokens": 394622,
          "time": 248.4
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 2.8514,
          "tokens": 918247,
          "time": 274.1
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.4533,
          "tokens": 178149,
          "time": 163.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.2536,
          "tokens": 116412,
          "time": 178.1
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.3447,
          "tokens": 217764,
          "time": 161.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": true,
          "cost": 1.1438,
          "tokens": 410987,
          "time": 190.0
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.8421,
          "tokens": 468052,
          "time": 243.8
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.1991,
          "tokens": 114233,
          "time": 95.8
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.4246,
          "tokens": 279573,
          "time": 147.4
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.254,
          "tokens": 141831,
          "time": 146.3
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.4576,
          "tokens": 333956,
          "time": 159.7
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 0.6955,
          "tokens": 317406,
          "time": 242.0
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.659,
          "tokens": 510359,
          "time": 342.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.6794,
          "tokens": 607051,
          "time": 187.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 0.6876,
          "tokens": 485985,
          "time": 353.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.6895,
          "tokens": 490424,
          "time": 287.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.7968,
          "tokens": 736872,
          "time": 315.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.1502,
          "tokens": 81336,
          "time": 75.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.3825,
          "tokens": 246926,
          "time": 220.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.3894,
          "tokens": 236342,
          "time": 141.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.3055,
          "tokens": 175589,
          "time": 172.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.4834,
          "tokens": 341065,
          "time": 247.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.8757,
          "tokens": 469316,
          "time": 262.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.2047,
          "tokens": 88965,
          "time": 126.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.417,
          "tokens": 278231,
          "time": 201.2
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.5399,
          "tokens": 353371,
          "time": 287.1
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.2991,
          "tokens": 205960,
          "time": 213.2
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.5089,
          "tokens": 359452,
          "time": 252.1
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 0.3432,
          "tokens": 222915,
          "time": 218.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.3776,
          "tokens": 271786,
          "time": 172.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.1122,
          "tokens": 50924,
          "time": 81.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.3013,
          "tokens": 169013,
          "time": 146.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 0.7429,
          "tokens": 636074,
          "time": 320.6
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.5498,
          "tokens": 317222,
          "time": 228.4
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.355,
          "tokens": 216333,
          "time": 185.5
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.7515,
          "tokens": 593842,
          "time": 285.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 1.7377,
          "tokens": 441104,
          "time": 291.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.3775,
          "tokens": 269512,
          "time": 169.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.8785,
          "tokens": 823150,
          "time": 370.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 5.6619,
          "tokens": 1171157,
          "time": 183.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.255,
          "tokens": 168156,
          "time": 112.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.1054,
          "tokens": 44380,
          "time": 68.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.1524,
          "tokens": 78231,
          "time": 108.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.1931,
          "tokens": 101979,
          "time": 109.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.4081,
          "tokens": 306242,
          "time": 175.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.3567,
          "tokens": 155995,
          "time": 125.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.2761,
          "tokens": 169582,
          "time": 152.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.3726,
          "tokens": 1002912,
          "time": 306.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": true,
          "cost": 1.7808,
          "tokens": 368094,
          "time": 336.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.592,
          "tokens": 445200,
          "time": 331.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 1.2484,
          "tokens": 1334629,
          "time": 407.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.2836,
          "tokens": 180671,
          "time": 195.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.2896,
          "tokens": 127100,
          "time": 135.2
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.0972,
          "tokens": 51900,
          "time": 84.5
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.1906,
          "tokens": 109156,
          "time": 126.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 0.1602,
          "tokens": 74991,
          "time": 114.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.3268,
          "tokens": 653891,
          "time": 205.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 3.8238,
          "tokens": 919483,
          "time": 266.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.6859,
          "tokens": 575083,
          "time": 260.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 1.1579,
          "tokens": 416334,
          "time": 203.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.9636,
          "tokens": 510573,
          "time": 309.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.2932,
          "tokens": 188027,
          "time": 207.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.6376,
          "tokens": 518411,
          "time": 279.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.3629,
          "tokens": 254225,
          "time": 226.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": true,
          "cost": 0.5784,
          "tokens": 451651,
          "time": 267.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.3763,
          "tokens": 270369,
          "time": 219.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.576,
          "tokens": 436453,
          "time": 256.0
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 0.2642,
          "tokens": 170374,
          "time": 129.9
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 0.5695,
          "tokens": 443882,
          "time": 346.8
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.3262,
          "tokens": 233135,
          "time": 133.9
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 6.9272,
          "tokens": 1472142,
          "time": 197.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.2472,
          "tokens": 161571,
          "time": 168.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.1856,
          "tokens": 99477,
          "time": 135.4
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 0.4574,
          "tokens": 227775,
          "time": 191.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.1495,
          "tokens": 68762,
          "time": 83.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.1889,
          "tokens": 107801,
          "time": 121.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.1141,
          "tokens": 52560,
          "time": 72.2
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 3.0527,
          "tokens": 1202999,
          "time": 360.2
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 0.4295,
          "tokens": 307703,
          "time": 188.1
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.4236,
          "tokens": 187519,
          "time": 162.8
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.2423,
          "tokens": 137021,
          "time": 135.6
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.1364,
          "tokens": 60618,
          "time": 122.0
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.7577,
          "tokens": 572435,
          "time": 293.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 2.0117,
          "tokens": 1815121,
          "time": 568.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.3391,
          "tokens": 244727,
          "time": 154.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.1612,
          "tokens": 76649,
          "time": 94.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.2394,
          "tokens": 116280,
          "time": 184.4
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 0.5185,
          "tokens": 308834,
          "time": 264.2
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.3112,
          "tokens": 191067,
          "time": 159.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.3818,
          "tokens": 97714,
          "time": 108.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": true,
          "cost": 6.5779,
          "tokens": 1527174,
          "time": 266.0
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.6083,
          "tokens": 524268,
          "time": 277.9
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 0.3377,
          "tokens": 189629,
          "time": 166.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.7091,
          "tokens": 332237,
          "time": 200.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.4427,
          "tokens": 298160,
          "time": 225.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.6839,
          "tokens": 324809,
          "time": 203.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.1238,
          "tokens": 66009,
          "time": 91.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.3675,
          "tokens": 188207,
          "time": 172.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.6581,
          "tokens": 435730,
          "time": 286.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.1816,
          "tokens": 91622,
          "time": 105.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.4335,
          "tokens": 310854,
          "time": 158.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.8638,
          "tokens": 498459,
          "time": 196.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 2.2944,
          "tokens": 548247,
          "time": 181.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.1192,
          "tokens": 360123,
          "time": 240.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 2.2209,
          "tokens": 701720,
          "time": 236.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 1.0934,
          "tokens": 364577,
          "time": 180.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.2607,
          "tokens": 136844,
          "time": 122.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.5679,
          "tokens": 410077,
          "time": 358.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.099,
          "tokens": 49002,
          "time": 79.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.4943,
          "tokens": 351123,
          "time": 221.8
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 1.3214,
          "tokens": 426302,
          "time": 216.3
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 0.1236,
          "tokens": 60160,
          "time": 92.7
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.3286,
          "tokens": 174308,
          "time": 205.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.7771,
          "tokens": 415040,
          "time": 332.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.5778,
          "tokens": 462594,
          "time": 283.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.5668,
          "tokens": 425597,
          "time": 239.1
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.5628,
          "tokens": 460243,
          "time": 210.2
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.9196,
          "tokens": 859559,
          "time": 347.3
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.3264,
          "tokens": 185409,
          "time": 201.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": true,
          "cost": 1.9305,
          "tokens": 586997,
          "time": 255.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.3817,
          "tokens": 234131,
          "time": 230.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.4713,
          "tokens": 315603,
          "time": 200.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": true,
          "cost": 1.7016,
          "tokens": 356150,
          "time": 92.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 0.3775,
          "tokens": 225960,
          "time": 179.5
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.1259,
          "tokens": 75049,
          "time": 154.9
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.4935,
          "tokens": 324774,
          "time": 253.2
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.3693,
          "tokens": 191893,
          "time": 148.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.155,
          "tokens": 76947,
          "time": 99.6
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.1439,
          "tokens": 71777,
          "time": 126.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.3123,
          "tokens": 199185,
          "time": 196.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.2792,
          "tokens": 108184,
          "time": 101.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.1765,
          "tokens": 88949,
          "time": 119.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.0734,
          "tokens": 36646,
          "time": 80.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.3705,
          "tokens": 269864,
          "time": 155.0
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.5403,
          "tokens": 431691,
          "time": 255.8
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 0.5061,
          "tokens": 307930,
          "time": 192.2
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.1424,
          "tokens": 57494,
          "time": 84.2
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 1.6648,
          "tokens": 351157,
          "time": 132.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 0.2211,
          "tokens": 132385,
          "time": 146.4
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.5256,
          "tokens": 409612,
          "time": 214.8
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.5126,
          "tokens": 306118,
          "time": 241.4
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 1.0706,
          "tokens": 543464,
          "time": 237.7
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.4456,
          "tokens": 335929,
          "time": 232.7
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.3847,
          "tokens": 280182,
          "time": 226.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.4649,
          "tokens": 319614,
          "time": 255.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 0.3663,
          "tokens": 274085,
          "time": 235.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.6274,
          "tokens": 233042,
          "time": 186.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.4741,
          "tokens": 260494,
          "time": 207.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.6597,
          "tokens": 382291,
          "time": 212.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.8695,
          "tokens": 544389,
          "time": 296.4
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.394,
          "tokens": 277815,
          "time": 197.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.1728,
          "tokens": 97347,
          "time": 140.8
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": true,
          "cost": 1.1962,
          "tokens": 563000,
          "time": 260.0
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": true,
          "cost": 0.1224,
          "tokens": 64897,
          "time": 94.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.385,
          "tokens": 276565,
          "time": 237.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.3837,
          "tokens": 197963,
          "time": 141.4
        }
      ]
    },
    {
      "runKey": "openclaw-opus-4.8",
      "harness": "openclaw",
      "model": "claude-opus-4.8",
      "modelName": "claude-opus-4.8",
      "reported": {
        "cost": 1.429,
        "tokens": 184000,
        "time": 163,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": true,
          "cost": 1.1471,
          "tokens": 156302,
          "time": 136.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 1.2263,
          "tokens": 160100,
          "time": 163.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 1.0106,
          "tokens": 128180,
          "time": 149.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": true,
          "cost": 1.1166,
          "tokens": 165192,
          "time": 141.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 1.4648,
          "tokens": 180476,
          "time": 194.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 1.0662,
          "tokens": 143916,
          "time": 131.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.1097,
          "tokens": 146535,
          "time": 158.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.6135,
          "tokens": 184512,
          "time": 222.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 2.1237,
          "tokens": 240085,
          "time": 241.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.8925,
          "tokens": 141516,
          "time": 96.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 1.0962,
          "tokens": 175866,
          "time": 123.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.5546,
          "tokens": 175820,
          "time": 208.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 2.5647,
          "tokens": 276063,
          "time": 256.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 1.3782,
          "tokens": 205853,
          "time": 128.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 1.2301,
          "tokens": 178692,
          "time": 138.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 1.8824,
          "tokens": 239368,
          "time": 194.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 1.3834,
          "tokens": 204403,
          "time": 153.1
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 1.1934,
          "tokens": 169993,
          "time": 140.8
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.9872,
          "tokens": 141998,
          "time": 138.5
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 1.5007,
          "tokens": 178181,
          "time": 236.0
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 1.1212,
          "tokens": 153440,
          "time": 149.2
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 1.007,
          "tokens": 142984,
          "time": 144.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": true,
          "cost": 1.8172,
          "tokens": 208352,
          "time": 206.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 1.012,
          "tokens": 132995,
          "time": 142.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 1.4724,
          "tokens": 206034,
          "time": 162.8
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 2.0663,
          "tokens": 222371,
          "time": 262.0
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 1.2165,
          "tokens": 137125,
          "time": 271.8
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 3.1875,
          "tokens": 283716,
          "time": 516.1
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 2.2298,
          "tokens": 235060,
          "time": 233.7
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 2.0221,
          "tokens": 252835,
          "time": 215.5
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 1.269,
          "tokens": 171178,
          "time": 163.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 1.7647,
          "tokens": 211223,
          "time": 219.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 1.3129,
          "tokens": 174204,
          "time": 151.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 1.3532,
          "tokens": 174535,
          "time": 170.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.1917,
          "tokens": 143630,
          "time": 207.3
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.9037,
          "tokens": 140354,
          "time": 106.2
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.9236,
          "tokens": 120447,
          "time": 131.5
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 1.854,
          "tokens": 231381,
          "time": 234.9
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 1.6065,
          "tokens": 219027,
          "time": 205.8
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 1.5869,
          "tokens": 181652,
          "time": 271.8
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.9888,
          "tokens": 128119,
          "time": 145.6
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 1.0068,
          "tokens": 139539,
          "time": 152.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 1.5047,
          "tokens": 169470,
          "time": 193.4
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 2.0156,
          "tokens": 249941,
          "time": 193.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": true,
          "cost": 0.928,
          "tokens": 141515,
          "time": 109.9
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 1.0091,
          "tokens": 152775,
          "time": 130.4
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 1.2581,
          "tokens": 195735,
          "time": 124.6
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.8763,
          "tokens": 124023,
          "time": 100.3
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.9927,
          "tokens": 147032,
          "time": 113.6
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 2.2983,
          "tokens": 258125,
          "time": 249.8
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.5454,
          "tokens": 243778,
          "time": 133.5
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": true,
          "cost": 1.7177,
          "tokens": 241719,
          "time": 145.8
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 1.2952,
          "tokens": 161216,
          "time": 217.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.4015,
          "tokens": 187456,
          "time": 166.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 3.0814,
          "tokens": 317304,
          "time": 333.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 2.2753,
          "tokens": 279960,
          "time": 239.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.8198,
          "tokens": 136087,
          "time": 83.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 1.1088,
          "tokens": 159655,
          "time": 139.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 1.2182,
          "tokens": 190868,
          "time": 113.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 1.4637,
          "tokens": 193731,
          "time": 162.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.8973,
          "tokens": 131691,
          "time": 111.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.3133,
          "tokens": 183803,
          "time": 149.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 1.8985,
          "tokens": 237550,
          "time": 223.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 1.3651,
          "tokens": 170043,
          "time": 203.4
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.2514,
          "tokens": 152562,
          "time": 191.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.5139,
          "tokens": 208731,
          "time": 160.1
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 1.84,
          "tokens": 230048,
          "time": 214.5
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.4431,
          "tokens": 203484,
          "time": 133.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 1.5369,
          "tokens": 202297,
          "time": 175.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 1.099,
          "tokens": 152903,
          "time": 129.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.7846,
          "tokens": 116373,
          "time": 103.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 1.5535,
          "tokens": 201363,
          "time": 233.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 1.3067,
          "tokens": 163372,
          "time": 152.4
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 1.7051,
          "tokens": 227534,
          "time": 183.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 1.6812,
          "tokens": 223242,
          "time": 172.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 1.3302,
          "tokens": 173810,
          "time": 163.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 1.3546,
          "tokens": 182081,
          "time": 171.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.6795,
          "tokens": 201804,
          "time": 229.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 1.6641,
          "tokens": 238924,
          "time": 165.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.7056,
          "tokens": 112651,
          "time": 80.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.8484,
          "tokens": 136938,
          "time": 92.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 2.0638,
          "tokens": 247594,
          "time": 221.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 1.3892,
          "tokens": 203606,
          "time": 139.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 1.4072,
          "tokens": 186470,
          "time": 141.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 1.5895,
          "tokens": 225593,
          "time": 175.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.4817,
          "tokens": 190136,
          "time": 862.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.5573,
          "tokens": 223817,
          "time": 150.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.9876,
          "tokens": 155619,
          "time": 113.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 1.3901,
          "tokens": 179678,
          "time": 170.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 2.1201,
          "tokens": 259797,
          "time": 233.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 1.8562,
          "tokens": 239726,
          "time": 206.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.54,
          "tokens": 208425,
          "time": 183.3
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.898,
          "tokens": 121365,
          "time": 109.1
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 1.8236,
          "tokens": 230718,
          "time": 158.5
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 0.8539,
          "tokens": 132280,
          "time": 103.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.2798,
          "tokens": 172216,
          "time": 147.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 2.0084,
          "tokens": 243508,
          "time": 221.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 1.6371,
          "tokens": 209252,
          "time": 168.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 1.1713,
          "tokens": 172616,
          "time": 124.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 2.1228,
          "tokens": 259365,
          "time": 236.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 1.5819,
          "tokens": 225427,
          "time": 182.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.6064,
          "tokens": 185170,
          "time": 195.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 1.708,
          "tokens": 247786,
          "time": 130.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 2.4773,
          "tokens": 225178,
          "time": 486.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 1.6226,
          "tokens": 196974,
          "time": 197.8
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 1.5651,
          "tokens": 210589,
          "time": 173.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 3.0494,
          "tokens": 293181,
          "time": 269.9
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 2.2873,
          "tokens": 239288,
          "time": 325.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 1.5658,
          "tokens": 196210,
          "time": 185.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 1.3494,
          "tokens": 199382,
          "time": 130.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 1.4408,
          "tokens": 201760,
          "time": 145.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.8406,
          "tokens": 121651,
          "time": 103.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 1.0025,
          "tokens": 138573,
          "time": 156.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 1.477,
          "tokens": 219515,
          "time": 129.0
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.9666,
          "tokens": 134036,
          "time": 107.4
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.9116,
          "tokens": 124639,
          "time": 142.3
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 1.3997,
          "tokens": 197361,
          "time": 147.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 1.8615,
          "tokens": 233980,
          "time": 229.3
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 1.4307,
          "tokens": 174526,
          "time": 187.4
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 1.2159,
          "tokens": 188097,
          "time": 134.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 1.6399,
          "tokens": 206683,
          "time": 175.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.7983,
          "tokens": 126304,
          "time": 93.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 1.8948,
          "tokens": 225458,
          "time": 198.1
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 1.6074,
          "tokens": 230367,
          "time": 148.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 1.261,
          "tokens": 187297,
          "time": 122.5
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 1.7984,
          "tokens": 206610,
          "time": 246.3
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 1.9927,
          "tokens": 223792,
          "time": 231.1
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 2.0633,
          "tokens": 233970,
          "time": 218.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": true,
          "cost": 1.3104,
          "tokens": 162234,
          "time": 170.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": true,
          "cost": 0.8059,
          "tokens": 129443,
          "time": 95.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 1.1707,
          "tokens": 154874,
          "time": 145.2
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 1.8947,
          "tokens": 226311,
          "time": 235.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.8268,
          "tokens": 115153,
          "time": 117.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 1.0383,
          "tokens": 162895,
          "time": 115.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": true,
          "cost": 1.1487,
          "tokens": 147860,
          "time": 159.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 1.494,
          "tokens": 199683,
          "time": 182.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 1.9829,
          "tokens": 208834,
          "time": 302.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 1.5328,
          "tokens": 206850,
          "time": 172.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 1.0234,
          "tokens": 162751,
          "time": 97.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 1.397,
          "tokens": 174435,
          "time": 160.6
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 1.4471,
          "tokens": 214214,
          "time": 145.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.9417,
          "tokens": 137324,
          "time": 125.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.4875,
          "tokens": 196136,
          "time": 190.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 1.433,
          "tokens": 195620,
          "time": 160.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 1.4298,
          "tokens": 200890,
          "time": 158.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 2.2327,
          "tokens": 251261,
          "time": 295.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 1.4377,
          "tokens": 161863,
          "time": 243.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.7798,
          "tokens": 121415,
          "time": 91.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 1.203,
          "tokens": 163937,
          "time": 178.9
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 2.5886,
          "tokens": 240208,
          "time": 553.5
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 1.1369,
          "tokens": 153667,
          "time": 145.8
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 1.2305,
          "tokens": 153103,
          "time": 174.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 1.4136,
          "tokens": 178359,
          "time": 186.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.5483,
          "tokens": 213261,
          "time": 159.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.6491,
          "tokens": 196103,
          "time": 202.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 1.192,
          "tokens": 180044,
          "time": 124.5
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.3365,
          "tokens": 152126,
          "time": 224.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 1.4962,
          "tokens": 191709,
          "time": 179.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.5136,
          "tokens": 186827,
          "time": 194.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.3627,
          "tokens": 160943,
          "time": 200.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": true,
          "cost": 1.5825,
          "tokens": 214930,
          "time": 164.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": true,
          "cost": 1.3502,
          "tokens": 186375,
          "time": 163.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 1.6114,
          "tokens": 204202,
          "time": 198.0
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.9876,
          "tokens": 142527,
          "time": 112.4
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 1.0457,
          "tokens": 145469,
          "time": 133.0
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 1.6719,
          "tokens": 231603,
          "time": 162.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.6656,
          "tokens": 103391,
          "time": 90.0
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 1.1242,
          "tokens": 146968,
          "time": 140.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 1.3268,
          "tokens": 179106,
          "time": 150.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.9873,
          "tokens": 144282,
          "time": 129.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.9802,
          "tokens": 137669,
          "time": 129.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.6612,
          "tokens": 97841,
          "time": 94.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.8011,
          "tokens": 108412,
          "time": 112.6
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 1.398,
          "tokens": 172461,
          "time": 183.9
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 1.075,
          "tokens": 141831,
          "time": 138.7
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 1.0126,
          "tokens": 143279,
          "time": 142.5
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 1.9542,
          "tokens": 208858,
          "time": 250.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 1.102,
          "tokens": 131000,
          "time": 153.4
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.3226,
          "tokens": 190590,
          "time": 146.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 1.2882,
          "tokens": 158154,
          "time": 208.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 1.2747,
          "tokens": 163446,
          "time": 166.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 1.3543,
          "tokens": 163086,
          "time": 179.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 1.1676,
          "tokens": 144675,
          "time": 164.4
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 1.6984,
          "tokens": 220785,
          "time": 204.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 1.2767,
          "tokens": 134979,
          "time": 196.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 1.0618,
          "tokens": 123396,
          "time": 157.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.9638,
          "tokens": 120813,
          "time": 141.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 1.5649,
          "tokens": 157504,
          "time": 270.4
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 2.1524,
          "tokens": 252728,
          "time": 255.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 1.7319,
          "tokens": 225813,
          "time": 185.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": true,
          "cost": 1.1903,
          "tokens": 169192,
          "time": 135.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 1.332,
          "tokens": 169916,
          "time": 194.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 1.164,
          "tokens": 171020,
          "time": 152.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.9293,
          "tokens": 119285,
          "time": 172.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.6852,
          "tokens": 217350,
          "time": 202.6
        }
      ]
    },
    {
      "runKey": "openclaw-gpt-5.5",
      "harness": "openclaw",
      "model": "gpt-5.5",
      "modelName": "gpt-5.5",
      "reported": {
        "cost": 0.798,
        "tokens": 60000,
        "time": 225,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.7925,
          "tokens": 48001,
          "time": 301.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.3576,
          "tokens": 48752,
          "time": 158.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 0.6158,
          "tokens": 50299,
          "time": 219.6
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.9776,
          "tokens": 66063,
          "time": 315.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.6594,
          "tokens": 50948,
          "time": 231.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.5539,
          "tokens": 41833,
          "time": 214.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.1129,
          "tokens": 73119,
          "time": 364.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.764,
          "tokens": 57463,
          "time": 264.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.3274,
          "tokens": 32422,
          "time": 143.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.4072,
          "tokens": 33819,
          "time": 159.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.7868,
          "tokens": 61218,
          "time": 240.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.8157,
          "tokens": 59672,
          "time": 276.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.9447,
          "tokens": 87822,
          "time": 269.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.8139,
          "tokens": 58823,
          "time": 275.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 1.1189,
          "tokens": 66427,
          "time": 321.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.9864,
          "tokens": 104704,
          "time": 268.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.8415,
          "tokens": 64356,
          "time": 248.0
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.483,
          "tokens": 41085,
          "time": 142.7
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": true,
          "cost": 1.1472,
          "tokens": 83390,
          "time": 307.4
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": true,
          "cost": 1.5016,
          "tokens": 104410,
          "time": 383.9
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.7669,
          "tokens": 62072,
          "time": 271.0
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.7835,
          "tokens": 52646,
          "time": 229.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 1.0064,
          "tokens": 73955,
          "time": 277.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.7254,
          "tokens": 78994,
          "time": 203.3
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.5422,
          "tokens": 47168,
          "time": 172.6
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.4701,
          "tokens": 43428,
          "time": 164.9
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.6998,
          "tokens": 55094,
          "time": 194.4
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.1754,
          "tokens": 88661,
          "time": 285.9
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.8679,
          "tokens": 73757,
          "time": 260.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": true,
          "cost": 0.6029,
          "tokens": 38449,
          "time": 200.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.5271,
          "tokens": 40038,
          "time": 180.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 1.4599,
          "tokens": 103656,
          "time": 383.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 1.1975,
          "tokens": 83249,
          "time": 366.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 1.6882,
          "tokens": 105715,
          "time": 423.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.4229,
          "tokens": 97386,
          "time": 355.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.6442,
          "tokens": 48385,
          "time": 204.4
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.6015,
          "tokens": 83099,
          "time": 411.5
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.8888,
          "tokens": 72801,
          "time": 280.3
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 1.1047,
          "tokens": 87750,
          "time": 353.8
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.7411,
          "tokens": 59132,
          "time": 272.7
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.6813,
          "tokens": 54213,
          "time": 245.3
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.8966,
          "tokens": 62524,
          "time": 323.4
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.4639,
          "tokens": 44335,
          "time": 164.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 0.7954,
          "tokens": 58365,
          "time": 237.4
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.7346,
          "tokens": 49489,
          "time": 247.6
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.9827,
          "tokens": 73853,
          "time": 292.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.8129,
          "tokens": 86314,
          "time": 200.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.5504,
          "tokens": 47639,
          "time": 167.7
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.6463,
          "tokens": 47354,
          "time": 189.4
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.5425,
          "tokens": 43082,
          "time": 182.1
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.5548,
          "tokens": 91299,
          "time": 437.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.8441,
          "tokens": 60148,
          "time": 284.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.6355,
          "tokens": 51647,
          "time": 195.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.1744,
          "tokens": 90439,
          "time": 372.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.588,
          "tokens": 51071,
          "time": 196.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.4594,
          "tokens": 43939,
          "time": 176.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.3279,
          "tokens": 29605,
          "time": 138.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.8901,
          "tokens": 62351,
          "time": 306.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.6655,
          "tokens": 59382,
          "time": 203.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.4306,
          "tokens": 42984,
          "time": 154.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.7923,
          "tokens": 60935,
          "time": 226.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.6257,
          "tokens": 134491,
          "time": 327.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.8426,
          "tokens": 90365,
          "time": 228.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.8022,
          "tokens": 58506,
          "time": 287.8
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.2252,
          "tokens": 76619,
          "time": 336.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.7657,
          "tokens": 53111,
          "time": 199.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.7602,
          "tokens": 54927,
          "time": 243.0
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 0.3737,
          "tokens": 30241,
          "time": 136.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.4852,
          "tokens": 30578,
          "time": 189.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.3063,
          "tokens": 26829,
          "time": 109.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.6471,
          "tokens": 57550,
          "time": 172.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 1.7362,
          "tokens": 87386,
          "time": 392.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.7942,
          "tokens": 55678,
          "time": 260.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.7959,
          "tokens": 43241,
          "time": 292.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.8264,
          "tokens": 61951,
          "time": 231.1
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 1.3402,
          "tokens": 74487,
          "time": 418.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.8768,
          "tokens": 66280,
          "time": 280.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.7083,
          "tokens": 60696,
          "time": 234.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.4442,
          "tokens": 41209,
          "time": 149.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.4597,
          "tokens": 33404,
          "time": 160.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.5465,
          "tokens": 60627,
          "time": 150.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.8806,
          "tokens": 94054,
          "time": 234.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.4675,
          "tokens": 35491,
          "time": 167.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.9101,
          "tokens": 54487,
          "time": 274.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.6488,
          "tokens": 48165,
          "time": 183.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.0707,
          "tokens": 73312,
          "time": 283.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.952,
          "tokens": 128900,
          "time": 430.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.8705,
          "tokens": 64814,
          "time": 297.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.7125,
          "tokens": 55977,
          "time": 213.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.7516,
          "tokens": 53444,
          "time": 244.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.6463,
          "tokens": 53235,
          "time": 207.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.1028,
          "tokens": 72342,
          "time": 298.4
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.4056,
          "tokens": 33324,
          "time": 131.5
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.4633,
          "tokens": 36997,
          "time": 160.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.4659,
          "tokens": 36423,
          "time": 147.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.4224,
          "tokens": 103582,
          "time": 340.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 1.3171,
          "tokens": 102131,
          "time": 294.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.8626,
          "tokens": 82970,
          "time": 212.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.6306,
          "tokens": 53347,
          "time": 166.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 1.0362,
          "tokens": 80630,
          "time": 275.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.5475,
          "tokens": 40424,
          "time": 185.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.8367,
          "tokens": 61105,
          "time": 277.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 1.0366,
          "tokens": 61109,
          "time": 287.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.8865,
          "tokens": 158046,
          "time": 374.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.7497,
          "tokens": 61983,
          "time": 222.0
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.6108,
          "tokens": 45472,
          "time": 229.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 1.3461,
          "tokens": 133251,
          "time": 279.2
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 1.3286,
          "tokens": 92106,
          "time": 281.6
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.558,
          "tokens": 41829,
          "time": 214.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.6839,
          "tokens": 56793,
          "time": 280.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.7627,
          "tokens": 50351,
          "time": 240.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.8803,
          "tokens": 53286,
          "time": 262.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.7245,
          "tokens": 47702,
          "time": 203.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.7958,
          "tokens": 59022,
          "time": 208.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.8649,
          "tokens": 62319,
          "time": 217.3
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.969,
          "tokens": 75941,
          "time": 247.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 2.2913,
          "tokens": 199319,
          "time": 426.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 1.0955,
          "tokens": 82561,
          "time": 244.5
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.3789,
          "tokens": 37790,
          "time": 124.4
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.703,
          "tokens": 46580,
          "time": 232.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.5254,
          "tokens": 40274,
          "time": 178.9
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.4474,
          "tokens": 30857,
          "time": 189.8
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.9377,
          "tokens": 77383,
          "time": 231.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.4062,
          "tokens": 36615,
          "time": 120.7
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.5134,
          "tokens": 42110,
          "time": 147.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 1.2014,
          "tokens": 107653,
          "time": 266.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 0.9636,
          "tokens": 66339,
          "time": 261.6
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 0.3157,
          "tokens": 25737,
          "time": 117.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.4336,
          "tokens": 33805,
          "time": 154.4
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.7923,
          "tokens": 78108,
          "time": 210.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.5079,
          "tokens": 38210,
          "time": 154.8
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.3947,
          "tokens": 34732,
          "time": 133.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.5159,
          "tokens": 55445,
          "time": 182.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.5766,
          "tokens": 44417,
          "time": 175.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.8115,
          "tokens": 51143,
          "time": 256.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 0.5308,
          "tokens": 33187,
          "time": 201.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.4949,
          "tokens": 43425,
          "time": 154.5
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": true,
          "cost": 1.0332,
          "tokens": 79939,
          "time": 255.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.5319,
          "tokens": 36571,
          "time": 180.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.9963,
          "tokens": 69077,
          "time": 262.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.6321,
          "tokens": 50486,
          "time": 185.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.8008,
          "tokens": 49817,
          "time": 233.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.5148,
          "tokens": 36441,
          "time": 185.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.8188,
          "tokens": 60275,
          "time": 222.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 1.0196,
          "tokens": 51519,
          "time": 337.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.6579,
          "tokens": 49843,
          "time": 181.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 1.0809,
          "tokens": 65086,
          "time": 285.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.3645,
          "tokens": 31134,
          "time": 152.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.9588,
          "tokens": 70144,
          "time": 272.4
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.6999,
          "tokens": 61212,
          "time": 202.2
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 0.8473,
          "tokens": 64696,
          "time": 235.7
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.78,
          "tokens": 54890,
          "time": 219.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 1.7565,
          "tokens": 116270,
          "time": 398.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.8528,
          "tokens": 104023,
          "time": 403.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.9295,
          "tokens": 72078,
          "time": 227.9
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.5071,
          "tokens": 37466,
          "time": 155.8
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.0679,
          "tokens": 69457,
          "time": 298.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.4581,
          "tokens": 35127,
          "time": 169.8
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.2468,
          "tokens": 84178,
          "time": 315.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.7006,
          "tokens": 49932,
          "time": 224.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.7528,
          "tokens": 51514,
          "time": 215.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.0647,
          "tokens": 83173,
          "time": 282.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 1.1854,
          "tokens": 87451,
          "time": 310.3
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.4028,
          "tokens": 31471,
          "time": 140.4
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.4584,
          "tokens": 36882,
          "time": 157.8
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.4735,
          "tokens": 33839,
          "time": 158.0
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.4562,
          "tokens": 44630,
          "time": 119.8
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.6869,
          "tokens": 74858,
          "time": 160.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.4629,
          "tokens": 36805,
          "time": 175.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.4282,
          "tokens": 31137,
          "time": 131.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.43,
          "tokens": 36855,
          "time": 153.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.5533,
          "tokens": 33934,
          "time": 180.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.5223,
          "tokens": 30502,
          "time": 171.9
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 0.6229,
          "tokens": 46590,
          "time": 185.9
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.4627,
          "tokens": 38450,
          "time": 162.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.3921,
          "tokens": 32402,
          "time": 143.4
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.4326,
          "tokens": 35586,
          "time": 141.3
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.3573,
          "tokens": 28810,
          "time": 129.5
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.812,
          "tokens": 61891,
          "time": 225.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.827,
          "tokens": 63920,
          "time": 231.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.8235,
          "tokens": 54507,
          "time": 258.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.9001,
          "tokens": 62323,
          "time": 309.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.844,
          "tokens": 74412,
          "time": 225.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.1785,
          "tokens": 14897,
          "time": 96.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.5848,
          "tokens": 44358,
          "time": 184.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.4803,
          "tokens": 50970,
          "time": 136.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.7742,
          "tokens": 53997,
          "time": 238.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.3606,
          "tokens": 31048,
          "time": 127.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 0.7947,
          "tokens": 56163,
          "time": 249.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.8744,
          "tokens": 61069,
          "time": 221.8
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": true,
          "cost": 0.4052,
          "tokens": 33532,
          "time": 161.4
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 1.0237,
          "tokens": 52466,
          "time": 313.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.5939,
          "tokens": 45080,
          "time": 185.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": true,
          "cost": 0.6314,
          "tokens": 49302,
          "time": 201.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.5681,
          "tokens": 125132,
          "time": 382.6
        }
      ]
    },
    {
      "runKey": "openclaw-gemini-3.5-flash",
      "harness": "openclaw",
      "model": "gemini-3.5-flash",
      "modelName": "gemini-3.5-flash",
      "reported": {
        "cost": 0.992,
        "tokens": 447000,
        "time": 231,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 1.2761,
          "tokens": 451157,
          "time": 304.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 1.619,
          "tokens": 686829,
          "time": 315.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 1.9737,
          "tokens": 754490,
          "time": 404.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": true,
          "cost": 1.2632,
          "tokens": 524019,
          "time": 271.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 0.6448,
          "tokens": 249707,
          "time": 193.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.7633,
          "tokens": 291390,
          "time": 206.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 1.0473,
          "tokens": 463017,
          "time": 268.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.9399,
          "tokens": 429226,
          "time": 217.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 1.3011,
          "tokens": 680656,
          "time": 188.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.6368,
          "tokens": 285301,
          "time": 162.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.9469,
          "tokens": 408796,
          "time": 225.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.3649,
          "tokens": 510236,
          "time": 381.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 1.0891,
          "tokens": 474097,
          "time": 264.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.7811,
          "tokens": 338535,
          "time": 187.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": true,
          "cost": 1.5608,
          "tokens": 720002,
          "time": 267.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 0.7572,
          "tokens": 299260,
          "time": 221.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 69.1
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 175.4
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 83.9
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 91.5
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.7569,
          "tokens": 328583,
          "time": 213.0
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 58.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 51.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.7235,
          "tokens": 317331,
          "time": 188.3
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 99.6
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 114.4
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 82.1
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 91.5
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 88.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 114.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 70.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 86.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 2.6016,
          "tokens": 1060585,
          "time": 415.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 85.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 106.9
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 1.5858,
          "tokens": 654050,
          "time": 298.2
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.8021,
          "tokens": 754786,
          "time": 333.8
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 1.5266,
          "tokens": 651517,
          "time": 243.8
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 1.0278,
          "tokens": 448937,
          "time": 280.7
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.9595,
          "tokens": 406546,
          "time": 247.9
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.7815,
          "tokens": 373628,
          "time": 194.8
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 1.5718,
          "tokens": 633067,
          "time": 375.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.7096,
          "tokens": 270420,
          "time": 209.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 2.0621,
          "tokens": 894665,
          "time": 306.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.9721,
          "tokens": 402910,
          "time": 245.5
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.77,
          "tokens": 334358,
          "time": 200.8
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 1.0397,
          "tokens": 505805,
          "time": 180.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.6452,
          "tokens": 305930,
          "time": 147.1
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.5951,
          "tokens": 262618,
          "time": 136.3
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 1.3624,
          "tokens": 611257,
          "time": 285.2
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.4611,
          "tokens": 703447,
          "time": 290.0
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": true,
          "cost": 1.1676,
          "tokens": 510557,
          "time": 227.8
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 2.0397,
          "tokens": 794936,
          "time": 400.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.0,
          "tokens": null,
          "time": 224.2
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 1.6627,
          "tokens": 732558,
          "time": 364.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": true,
          "cost": 0.9015,
          "tokens": 378601,
          "time": 240.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.6538,
          "tokens": 313742,
          "time": 160.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 1.6035,
          "tokens": 668640,
          "time": 294.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.5926,
          "tokens": 251414,
          "time": 170.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.3674,
          "tokens": 202438,
          "time": 92.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.6836,
          "tokens": 287832,
          "time": 197.2
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.786,
          "tokens": 689832,
          "time": 352.9
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 5.9706,
          "tokens": 2062303,
          "time": 772.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": true,
          "cost": 1.8047,
          "tokens": 873754,
          "time": 286.8
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.7251,
          "tokens": 289270,
          "time": 253.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.0168,
          "tokens": 435048,
          "time": 216.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 1.1002,
          "tokens": 511280,
          "time": 222.0
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.0814,
          "tokens": 440502,
          "time": 239.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.2116,
          "tokens": 84307,
          "time": 99.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.1802,
          "tokens": 68996,
          "time": 89.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 1.2508,
          "tokens": 558179,
          "time": 258.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 1.4902,
          "tokens": 619543,
          "time": 309.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.9473,
          "tokens": 421283,
          "time": 214.6
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 1.3636,
          "tokens": 557376,
          "time": 362.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 1.0487,
          "tokens": 421495,
          "time": 308.9
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.746,
          "tokens": 319420,
          "time": 238.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 1.2277,
          "tokens": 477616,
          "time": 272.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.1462,
          "tokens": 570432,
          "time": 234.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.7265,
          "tokens": 283913,
          "time": 261.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.7526,
          "tokens": 333444,
          "time": 199.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.5433,
          "tokens": 229637,
          "time": 203.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.8001,
          "tokens": 335280,
          "time": 210.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.8997,
          "tokens": 380514,
          "time": 238.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 1.5265,
          "tokens": 671296,
          "time": 296.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 1.25,
          "tokens": 626753,
          "time": 181.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.1939,
          "tokens": 536817,
          "time": 236.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.1398,
          "tokens": 456046,
          "time": 254.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 1.3223,
          "tokens": 544749,
          "time": 293.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 1.1251,
          "tokens": 462661,
          "time": 260.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.6014,
          "tokens": 278442,
          "time": 152.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 1.0017,
          "tokens": 430899,
          "time": 271.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.2425,
          "tokens": 579611,
          "time": 266.2
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.4658,
          "tokens": 193932,
          "time": 156.2
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.7772,
          "tokens": 334266,
          "time": 184.5
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.6592,
          "tokens": 259543,
          "time": 197.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.1136,
          "tokens": 516005,
          "time": 242.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 1.138,
          "tokens": 494025,
          "time": 255.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 1.037,
          "tokens": 441494,
          "time": 217.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.6318,
          "tokens": 243812,
          "time": 184.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.0182,
          "tokens": 5209,
          "time": 47.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 1.0193,
          "tokens": 427106,
          "time": 263.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 1.4105,
          "tokens": 601615,
          "time": 305.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.9024,
          "tokens": 426516,
          "time": 179.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.2562,
          "tokens": 104877,
          "time": 96.8
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.2547,
          "tokens": 121904,
          "time": 115.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 1.3641,
          "tokens": 577868,
          "time": 294.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 1.795,
          "tokens": 768485,
          "time": 283.7
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.772,
          "tokens": 646155,
          "time": 385.4
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.9208,
          "tokens": 403676,
          "time": 199.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 1.1676,
          "tokens": 505892,
          "time": 218.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.6208,
          "tokens": 273686,
          "time": 177.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.5527,
          "tokens": 240409,
          "time": 149.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 0.9054,
          "tokens": 352588,
          "time": 255.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.7285,
          "tokens": 317361,
          "time": 196.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.5693,
          "tokens": 261486,
          "time": 175.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.6638,
          "tokens": 319073,
          "time": 135.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.5679,
          "tokens": 267273,
          "time": 149.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 2.401,
          "tokens": 952807,
          "time": 381.8
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.5175,
          "tokens": 227862,
          "time": 163.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.7057,
          "tokens": 294317,
          "time": 180.8
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.8437,
          "tokens": 353809,
          "time": 217.1
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.8849,
          "tokens": 366179,
          "time": 296.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 1.0649,
          "tokens": 476976,
          "time": 232.0
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.3975,
          "tokens": 190508,
          "time": 131.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": false,
          "cost": 0.0127,
          "tokens": 3358,
          "time": 49.9
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.8585,
          "tokens": 342166,
          "time": 274.7
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.5068,
          "tokens": 200289,
          "time": 167.9
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 2.3842,
          "tokens": 867108,
          "time": 551.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.5901,
          "tokens": 251476,
          "time": 186.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 1.377,
          "tokens": 541418,
          "time": 332.5
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.9604,
          "tokens": 382679,
          "time": 252.3
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 2.158,
          "tokens": 930186,
          "time": 459.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.5206,
          "tokens": 224264,
          "time": 149.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.4989,
          "tokens": 194597,
          "time": 166.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 1.5371,
          "tokens": 639946,
          "time": 277.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 1.2391,
          "tokens": 494478,
          "time": 309.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.9646,
          "tokens": 372998,
          "time": 237.5
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 1.0502,
          "tokens": 511855,
          "time": 265.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.7577,
          "tokens": 370648,
          "time": 172.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 1.1701,
          "tokens": 491568,
          "time": 216.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.199,
          "tokens": 74651,
          "time": 100.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.5964,
          "tokens": 230169,
          "time": 166.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.1346,
          "tokens": 495530,
          "time": 274.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.7678,
          "tokens": 352943,
          "time": 172.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 1.0892,
          "tokens": 445836,
          "time": 240.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 3.2767,
          "tokens": 1130163,
          "time": 459.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 1.0726,
          "tokens": 437220,
          "time": 251.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 1.274,
          "tokens": 489240,
          "time": 283.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.8161,
          "tokens": 336871,
          "time": 192.9
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.9737,
          "tokens": 369990,
          "time": 273.5
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 1.0128,
          "tokens": 435738,
          "time": 198.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 1.1883,
          "tokens": 460606,
          "time": 290.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 2.68,
          "tokens": 1101051,
          "time": 468.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.4539,
          "tokens": 598166,
          "time": 280.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.4987,
          "tokens": 628312,
          "time": 334.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.8562,
          "tokens": 354972,
          "time": 175.0
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": true,
          "cost": 0.9102,
          "tokens": 351127,
          "time": 280.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 1.6168,
          "tokens": 589365,
          "time": 337.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 2.3746,
          "tokens": 764805,
          "time": 497.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.2999,
          "tokens": 463553,
          "time": 325.4
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": true,
          "cost": 1.1357,
          "tokens": 503765,
          "time": 246.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.4612,
          "tokens": 565906,
          "time": 444.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 1.829,
          "tokens": 697752,
          "time": 454.7
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.3748,
          "tokens": 175830,
          "time": 99.2
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.6165,
          "tokens": 256448,
          "time": 174.4
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 1.0469,
          "tokens": 384310,
          "time": 251.6
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": false,
          "cost": 0.0335,
          "tokens": 18838,
          "time": 54.6
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.5314,
          "tokens": 210780,
          "time": 169.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 2.3914,
          "tokens": 964742,
          "time": 503.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.2972,
          "tokens": 123412,
          "time": 116.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.5574,
          "tokens": 212310,
          "time": 154.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.4882,
          "tokens": 229749,
          "time": 130.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.8703,
          "tokens": 345301,
          "time": 212.2
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 1.0535,
          "tokens": 432694,
          "time": 232.8
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 1.0251,
          "tokens": 373679,
          "time": 296.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.3127,
          "tokens": 124796,
          "time": 124.2
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.5669,
          "tokens": 225424,
          "time": 185.1
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.1477,
          "tokens": 51436,
          "time": 81.8
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.2356,
          "tokens": 456321,
          "time": 367.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 2.6044,
          "tokens": 902834,
          "time": 531.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 1.298,
          "tokens": 488351,
          "time": 333.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 1.8087,
          "tokens": 738400,
          "time": 419.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.9046,
          "tokens": 346723,
          "time": 268.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": true,
          "cost": 0.8358,
          "tokens": 361017,
          "time": 244.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.6034,
          "tokens": 203765,
          "time": 204.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.6125,
          "tokens": 227446,
          "time": 212.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": true,
          "cost": 0.8437,
          "tokens": 328859,
          "time": 343.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 1.054,
          "tokens": 406681,
          "time": 312.4
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 1.8881,
          "tokens": 627415,
          "time": 477.5
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.7029,
          "tokens": 274800,
          "time": 240.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 1.7161,
          "tokens": 678554,
          "time": 322.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 1.4199,
          "tokens": 489084,
          "time": 341.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 1.3583,
          "tokens": 584677,
          "time": 254.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": true,
          "cost": 0.5343,
          "tokens": 236293,
          "time": 138.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.5965,
          "tokens": 242423,
          "time": 172.6
        }
      ]
    },
    {
      "runKey": "openclaw-gemini-3.1-pro",
      "harness": "openclaw",
      "model": "gemini-3.1-pro-preview",
      "modelName": "gemini-3.1-pro-preview",
      "reported": {
        "cost": 0.857,
        "tokens": 331000,
        "time": 172,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.4514,
          "tokens": 190962,
          "time": 112.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.9725,
          "tokens": 424431,
          "time": 145.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 1.9475,
          "tokens": 775655,
          "time": 294.4
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.364,
          "tokens": 520132,
          "time": 273.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 0.799,
          "tokens": 292845,
          "time": 197.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.638,
          "tokens": 267975,
          "time": 130.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 1.1478,
          "tokens": 470072,
          "time": 176.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.4366,
          "tokens": 519382,
          "time": 231.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 1.088,
          "tokens": 459150,
          "time": 177.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 1.0565,
          "tokens": 449988,
          "time": 149.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 1.0588,
          "tokens": 421474,
          "time": 198.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.0246,
          "tokens": 442136,
          "time": 153.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.0586,
          "tokens": 456929,
          "time": 211.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.3301,
          "tokens": 148755,
          "time": 86.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.9656,
          "tokens": 370664,
          "time": 174.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 1.0963,
          "tokens": 429577,
          "time": 194.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 1.6571,
          "tokens": 566761,
          "time": 368.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.7217,
          "tokens": 282455,
          "time": 154.1
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.5877,
          "tokens": 222612,
          "time": 248.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": true,
          "cost": 2.6597,
          "tokens": 977726,
          "time": 438.4
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.6169,
          "tokens": 259231,
          "time": 144.9
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 0.904,
          "tokens": 349824,
          "time": 199.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.786,
          "tokens": 312310,
          "time": 211.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.9141,
          "tokens": 350057,
          "time": 205.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 1.0555,
          "tokens": 400672,
          "time": 235.4
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.6022,
          "tokens": 244985,
          "time": 172.4
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.5639,
          "tokens": 205244,
          "time": 180.0
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.2945,
          "tokens": 107689,
          "time": 126.6
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 1.1034,
          "tokens": 459354,
          "time": 183.5
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 1.4683,
          "tokens": 625762,
          "time": 198.8
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.4969,
          "tokens": 208396,
          "time": 112.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 0.8798,
          "tokens": 342957,
          "time": 190.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.7012,
          "tokens": 294755,
          "time": 169.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.647,
          "tokens": 285990,
          "time": 110.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.6196,
          "tokens": 259737,
          "time": 161.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 1.3366,
          "tokens": 559164,
          "time": 242.1
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.6138,
          "tokens": 238166,
          "time": 156.6
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.9714,
          "tokens": 397354,
          "time": 161.1
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.5259,
          "tokens": 199132,
          "time": 160.1
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.6038,
          "tokens": 247610,
          "time": 156.5
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.5403,
          "tokens": 213093,
          "time": 130.4
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 1.2463,
          "tokens": 465132,
          "time": 261.4
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 1.08,
          "tokens": 405529,
          "time": 272.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 0.5869,
          "tokens": 243868,
          "time": 121.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": true,
          "cost": 2.4997,
          "tokens": 921886,
          "time": 324.2
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.5917,
          "tokens": 247697,
          "time": 147.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.3641,
          "tokens": 158168,
          "time": 110.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.0513,
          "tokens": 22450,
          "time": 62.2
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 1.3596,
          "tokens": 531792,
          "time": 205.3
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 1.0896,
          "tokens": 475840,
          "time": 176.0
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 0.7103,
          "tokens": 284841,
          "time": 139.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.7647,
          "tokens": 341833,
          "time": 144.8
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.8236,
          "tokens": 325685,
          "time": 172.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.9221,
          "tokens": 329123,
          "time": 261.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 1.4358,
          "tokens": 557141,
          "time": 231.1
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.9758,
          "tokens": 397203,
          "time": 185.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.3383,
          "tokens": 153989,
          "time": 86.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.6711,
          "tokens": 276174,
          "time": 138.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.7595,
          "tokens": 313684,
          "time": 154.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": false,
          "cost": 0.0468,
          "tokens": 19454,
          "time": 54.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.835,
          "tokens": 330992,
          "time": 178.2
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.3619,
          "tokens": 579757,
          "time": 194.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 1.3909,
          "tokens": 516411,
          "time": 299.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.8016,
          "tokens": 301247,
          "time": 243.5
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.6032,
          "tokens": 220681,
          "time": 194.2
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.38,
          "tokens": 147477,
          "time": 123.8
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 2.4728,
          "tokens": 842883,
          "time": 425.0
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.5699,
          "tokens": 567771,
          "time": 330.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 0.052,
          "tokens": 19021,
          "time": 70.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.2615,
          "tokens": 101469,
          "time": 104.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.3092,
          "tokens": 117031,
          "time": 125.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 1.2663,
          "tokens": 462447,
          "time": 313.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.4543,
          "tokens": 170996,
          "time": 147.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 1.0907,
          "tokens": 434811,
          "time": 196.6
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 1.4447,
          "tokens": 525540,
          "time": 336.4
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 1.0015,
          "tokens": 389360,
          "time": 214.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.5472,
          "tokens": 214579,
          "time": 144.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": true,
          "cost": 0.2566,
          "tokens": 99142,
          "time": 100.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 1.3691,
          "tokens": 541874,
          "time": 264.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.3352,
          "tokens": 144397,
          "time": 116.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.9998,
          "tokens": 408718,
          "time": 191.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.6669,
          "tokens": 233374,
          "time": 200.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.2626,
          "tokens": 100290,
          "time": 114.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 1.335,
          "tokens": 550542,
          "time": 245.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.7198,
          "tokens": 305522,
          "time": 137.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.7289,
          "tokens": 645198,
          "time": 281.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.4942,
          "tokens": 189750,
          "time": 163.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.5651,
          "tokens": 233155,
          "time": 131.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.9819,
          "tokens": 391652,
          "time": 180.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 1.0709,
          "tokens": 396538,
          "time": 215.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.8914,
          "tokens": 321751,
          "time": 199.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.7042,
          "tokens": 260238,
          "time": 158.3
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.3882,
          "tokens": 149513,
          "time": 137.8
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.9058,
          "tokens": 328819,
          "time": 206.6
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 1.3952,
          "tokens": 497328,
          "time": 318.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 2.6546,
          "tokens": 1028778,
          "time": 305.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 0.5259,
          "tokens": 209789,
          "time": 126.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.4291,
          "tokens": 171413,
          "time": 131.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 1.2194,
          "tokens": 519550,
          "time": 165.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.5739,
          "tokens": 223782,
          "time": 138.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 0.1669,
          "tokens": 68060,
          "time": 213.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.9766,
          "tokens": 424617,
          "time": 178.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.5986,
          "tokens": 246950,
          "time": 155.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.1536,
          "tokens": 471461,
          "time": 188.0
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.9812,
          "tokens": 384104,
          "time": 207.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 1.5347,
          "tokens": 548006,
          "time": 339.8
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.0781,
          "tokens": 31355,
          "time": 60.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.493,
          "tokens": 537207,
          "time": 336.9
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.5639,
          "tokens": 230176,
          "time": 125.4
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.733,
          "tokens": 299148,
          "time": 135.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.833,
          "tokens": 311529,
          "time": 203.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.576,
          "tokens": 241685,
          "time": 127.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 1.0048,
          "tokens": 371942,
          "time": 206.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.8116,
          "tokens": 318511,
          "time": 171.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.8557,
          "tokens": 302274,
          "time": 213.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.176,
          "tokens": 62757,
          "time": 90.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.311,
          "tokens": 121496,
          "time": 123.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 2.7292,
          "tokens": 973970,
          "time": 336.3
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.2913,
          "tokens": 122279,
          "time": 88.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.3565,
          "tokens": 149810,
          "time": 102.6
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.7139,
          "tokens": 281123,
          "time": 185.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.2676,
          "tokens": 98727,
          "time": 111.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.5567,
          "tokens": 227394,
          "time": 127.4
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.6241,
          "tokens": 253254,
          "time": 140.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.5708,
          "tokens": 236402,
          "time": 127.6
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": true,
          "cost": 0.4116,
          "tokens": 147411,
          "time": 148.9
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.5658,
          "tokens": 217329,
          "time": 144.2
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 2.2142,
          "tokens": 1002602,
          "time": 152.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.91,
          "tokens": 339973,
          "time": 204.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.4167,
          "tokens": 163345,
          "time": 121.8
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 1.7699,
          "tokens": 616251,
          "time": 371.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.4983,
          "tokens": 190274,
          "time": 141.4
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.9681,
          "tokens": 394835,
          "time": 165.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.3366,
          "tokens": 131265,
          "time": 104.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 0.6917,
          "tokens": 263231,
          "time": 184.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 1.4314,
          "tokens": 516627,
          "time": 282.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": true,
          "cost": 0.6146,
          "tokens": 249848,
          "time": 178.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.2602,
          "tokens": 100895,
          "time": 97.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.272,
          "tokens": 112883,
          "time": 88.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.3195,
          "tokens": 128193,
          "time": 87.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.9649,
          "tokens": 374106,
          "time": 230.3
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.9016,
          "tokens": 338161,
          "time": 201.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 0.2715,
          "tokens": 108796,
          "time": 90.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.6351,
          "tokens": 244675,
          "time": 138.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.5242,
          "tokens": 227829,
          "time": 122.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.6921,
          "tokens": 262075,
          "time": 174.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.9829,
          "tokens": 372861,
          "time": 206.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 1.2294,
          "tokens": 439766,
          "time": 324.2
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.6957,
          "tokens": 263640,
          "time": 170.9
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 1.0001,
          "tokens": 369281,
          "time": 222.0
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 1.0861,
          "tokens": 423046,
          "time": 199.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 2.7887,
          "tokens": 955082,
          "time": 555.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 2.2815,
          "tokens": 859617,
          "time": 397.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.9925,
          "tokens": 333544,
          "time": 305.4
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 1.2514,
          "tokens": 428247,
          "time": 264.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.8159,
          "tokens": 329632,
          "time": 207.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.5749,
          "tokens": 222671,
          "time": 160.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.4564,
          "tokens": 544708,
          "time": 287.4
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.745,
          "tokens": 614915,
          "time": 367.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.5608,
          "tokens": 229765,
          "time": 134.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.6,
          "tokens": 504013,
          "time": 364.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.5141,
          "tokens": 188988,
          "time": 151.4
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 1.1577,
          "tokens": 488857,
          "time": 150.8
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.1618,
          "tokens": 63144,
          "time": 77.9
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.2038,
          "tokens": 67170,
          "time": 105.8
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.2422,
          "tokens": 87902,
          "time": 104.7
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.5513,
          "tokens": 234866,
          "time": 129.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.3109,
          "tokens": 124698,
          "time": 99.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.6265,
          "tokens": 258810,
          "time": 138.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.697,
          "tokens": 276228,
          "time": 181.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.7116,
          "tokens": 275480,
          "time": 210.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.4038,
          "tokens": 177527,
          "time": 88.8
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 1.5203,
          "tokens": 574858,
          "time": 263.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.8666,
          "tokens": 300141,
          "time": 208.2
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.3126,
          "tokens": 124608,
          "time": 86.5
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.8459,
          "tokens": 312260,
          "time": 214.0
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.2044,
          "tokens": 77244,
          "time": 88.3
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.9107,
          "tokens": 359311,
          "time": 205.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 1.5169,
          "tokens": 526408,
          "time": 350.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.6282,
          "tokens": 237866,
          "time": 153.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.9675,
          "tokens": 331441,
          "time": 257.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.5137,
          "tokens": 204278,
          "time": 136.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.265,
          "tokens": 113379,
          "time": 83.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.666,
          "tokens": 207205,
          "time": 202.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": true,
          "cost": 1.2423,
          "tokens": 447293,
          "time": 266.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": true,
          "cost": 0.686,
          "tokens": 275175,
          "time": 147.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.5186,
          "tokens": 176959,
          "time": 172.0
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 1.2114,
          "tokens": 473570,
          "time": 231.5
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.4423,
          "tokens": 168402,
          "time": 131.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.467,
          "tokens": 195367,
          "time": 117.9
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.7709,
          "tokens": 285223,
          "time": 273.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": true,
          "cost": 0.6009,
          "tokens": 245581,
          "time": 132.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.451,
          "tokens": 162448,
          "time": 145.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.4301,
          "tokens": 162210,
          "time": 121.0
        }
      ]
    },
    {
      "runKey": "openclaw-sonnet-4.5",
      "harness": "openclaw",
      "model": "claude-sonnet-4.5",
      "modelName": "claude-sonnet-4.5",
      "reported": {
        "cost": 1.564,
        "tokens": 458000,
        "time": 161,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 2.8574,
          "tokens": 865650,
          "time": 177.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 1.3141,
          "tokens": 372774,
          "time": 153.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 2.5063,
          "tokens": 738829,
          "time": 209.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.8423,
          "tokens": 541538,
          "time": 162.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 1.5105,
          "tokens": 440987,
          "time": 162.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 2.1127,
          "tokens": 635862,
          "time": 171.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.7373,
          "tokens": 206454,
          "time": 122.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.86,
          "tokens": 540919,
          "time": 168.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 1.0173,
          "tokens": 289659,
          "time": 134.3
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 1.6264,
          "tokens": 474365,
          "time": 168.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 1.7056,
          "tokens": 510395,
          "time": 168.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.065,
          "tokens": 292806,
          "time": 167.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.7928,
          "tokens": 522691,
          "time": 173.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.6706,
          "tokens": 185727,
          "time": 102.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": true,
          "cost": 1.8882,
          "tokens": 557936,
          "time": 195.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 1.655,
          "tokens": 496731,
          "time": 148.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 1.3841,
          "tokens": 401627,
          "time": 162.5
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 2.1303,
          "tokens": 621254,
          "time": 208.7
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 1.6957,
          "tokens": 496518,
          "time": 192.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 2.5737,
          "tokens": 764105,
          "time": 251.7
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 1.3406,
          "tokens": 393923,
          "time": 159.1
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 1.1087,
          "tokens": 316478,
          "time": 171.0
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": true,
          "cost": 1.7525,
          "tokens": 514745,
          "time": 196.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 1.7568,
          "tokens": 527490,
          "time": 156.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 2.6424,
          "tokens": 796947,
          "time": 226.7
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.4603,
          "tokens": 438070,
          "time": 159.3
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 2.6028,
          "tokens": 801261,
          "time": 188.8
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 2.376,
          "tokens": 704782,
          "time": 234.8
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 1.7948,
          "tokens": 509206,
          "time": 219.4
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 2.1873,
          "tokens": 651403,
          "time": 211.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 1.2695,
          "tokens": 368334,
          "time": 159.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 2.8033,
          "tokens": 849401,
          "time": 209.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 1.7422,
          "tokens": 504797,
          "time": 212.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.7978,
          "tokens": 210656,
          "time": 141.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 2.3957,
          "tokens": 712933,
          "time": 227.8
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.9969,
          "tokens": 280681,
          "time": 126.1
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.2854,
          "tokens": 362981,
          "time": 180.9
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 2.1597,
          "tokens": 632246,
          "time": 193.4
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 1.9423,
          "tokens": 555811,
          "time": 248.2
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 2.1312,
          "tokens": 608657,
          "time": 256.9
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 2.0348,
          "tokens": 607762,
          "time": 170.9
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 1.107,
          "tokens": 316296,
          "time": 142.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 1.0141,
          "tokens": 279873,
          "time": 157.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 2.1544,
          "tokens": 627420,
          "time": 213.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 1.6207,
          "tokens": 486547,
          "time": 146.0
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": true,
          "cost": 1.8246,
          "tokens": 549176,
          "time": 135.4
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.3383,
          "tokens": 88456,
          "time": 89.4
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.6866,
          "tokens": 192446,
          "time": 113.6
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.6888,
          "tokens": 191513,
          "time": 116.9
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.8908,
          "tokens": 260686,
          "time": 120.0
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.9994,
          "tokens": 600310,
          "time": 185.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 1.1253,
          "tokens": 329032,
          "time": 140.4
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 1.001,
          "tokens": 294928,
          "time": 118.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 2.1408,
          "tokens": 598877,
          "time": 264.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.623,
          "tokens": 172873,
          "time": 118.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 2.0254,
          "tokens": 617769,
          "time": 144.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.8557,
          "tokens": 248558,
          "time": 111.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 1.6226,
          "tokens": 495367,
          "time": 135.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.9519,
          "tokens": 269476,
          "time": 122.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 1.496,
          "tokens": 443302,
          "time": 161.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.6736,
          "tokens": 183932,
          "time": 122.3
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 2.6075,
          "tokens": 768823,
          "time": 223.4
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 1.2545,
          "tokens": 360501,
          "time": 168.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 1.3182,
          "tokens": 361415,
          "time": 189.3
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 1.0141,
          "tokens": 287384,
          "time": 148.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.4874,
          "tokens": 431381,
          "time": 164.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 1.2252,
          "tokens": 360254,
          "time": 164.7
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 0.6705,
          "tokens": 189551,
          "time": 104.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.7487,
          "tokens": 214886,
          "time": 126.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.464,
          "tokens": 129405,
          "time": 93.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.9951,
          "tokens": 282072,
          "time": 151.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 1.3559,
          "tokens": 399002,
          "time": 168.2
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 1.6093,
          "tokens": 464457,
          "time": 185.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 1.2853,
          "tokens": 367539,
          "time": 170.9
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 1.3333,
          "tokens": 395004,
          "time": 135.3
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 1.8551,
          "tokens": 550165,
          "time": 184.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 1.3914,
          "tokens": 401511,
          "time": 162.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 2.1765,
          "tokens": 630883,
          "time": 220.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 1.432,
          "tokens": 431865,
          "time": 136.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 1.0668,
          "tokens": 308609,
          "time": 119.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.619,
          "tokens": 170143,
          "time": 104.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.4799,
          "tokens": 130030,
          "time": 102.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 1.3125,
          "tokens": 386600,
          "time": 123.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 1.6658,
          "tokens": 493448,
          "time": 156.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 1.1502,
          "tokens": 334404,
          "time": 142.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 1.0302,
          "tokens": 297066,
          "time": 136.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 1.7499,
          "tokens": 521008,
          "time": 158.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 1.9866,
          "tokens": 589482,
          "time": 167.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 2.7931,
          "tokens": 834950,
          "time": 256.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 1.0553,
          "tokens": 292661,
          "time": 153.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 1.8172,
          "tokens": 536110,
          "time": 188.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.1463,
          "tokens": 314587,
          "time": 156.2
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 1.8913,
          "tokens": 553055,
          "time": 170.9
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.6441,
          "tokens": 178042,
          "time": 112.1
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.3312,
          "tokens": 89071,
          "time": 89.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 2.2665,
          "tokens": 675496,
          "time": 194.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 1.595,
          "tokens": 473842,
          "time": 149.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 1.6923,
          "tokens": 505052,
          "time": 163.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 2.634,
          "tokens": 781085,
          "time": 194.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 2.102,
          "tokens": 631110,
          "time": 168.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 3.4506,
          "tokens": 1035605,
          "time": 270.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 2.6488,
          "tokens": 805100,
          "time": 192.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.8997,
          "tokens": 257212,
          "time": 112.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 3.0931,
          "tokens": 924109,
          "time": 247.8
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 2.12,
          "tokens": 613545,
          "time": 225.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 1.4381,
          "tokens": 391173,
          "time": 206.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 2.77,
          "tokens": 856311,
          "time": 162.5
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.4641,
          "tokens": 433969,
          "time": 150.6
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": false,
          "cost": 1.846,
          "tokens": 563837,
          "time": 136.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 2.7908,
          "tokens": 867081,
          "time": 174.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 1.149,
          "tokens": 327198,
          "time": 143.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.9738,
          "tokens": 290164,
          "time": 108.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 2.5944,
          "tokens": 793602,
          "time": 173.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.4647,
          "tokens": 129709,
          "time": 80.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.7483,
          "tokens": 206479,
          "time": 112.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 2.0207,
          "tokens": 590532,
          "time": 214.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 2.4374,
          "tokens": 737823,
          "time": 188.3
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 1.9341,
          "tokens": 578166,
          "time": 154.0
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 1.2651,
          "tokens": 363198,
          "time": 135.6
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 2.3531,
          "tokens": 703320,
          "time": 177.4
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 1.3639,
          "tokens": 381505,
          "time": 170.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.8743,
          "tokens": 250610,
          "time": 110.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 1.6058,
          "tokens": 476909,
          "time": 146.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.5314,
          "tokens": 150456,
          "time": 87.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.5959,
          "tokens": 164295,
          "time": 117.9
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 1.7906,
          "tokens": 534999,
          "time": 182.8
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 2.4038,
          "tokens": 696448,
          "time": 235.1
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 2.0516,
          "tokens": 606527,
          "time": 187.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 1.0269,
          "tokens": 276482,
          "time": 183.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 1.4205,
          "tokens": 416289,
          "time": 139.5
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 1.5809,
          "tokens": 447906,
          "time": 191.0
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.8365,
          "tokens": 239279,
          "time": 112.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 1.5364,
          "tokens": 464011,
          "time": 137.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 1.6131,
          "tokens": 469672,
          "time": 151.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 1.7476,
          "tokens": 516263,
          "time": 180.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 0.3891,
          "tokens": 106981,
          "time": 81.0
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 2.0647,
          "tokens": 610533,
          "time": 189.9
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 3.0412,
          "tokens": 913327,
          "time": 227.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 1.1599,
          "tokens": 330235,
          "time": 133.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 2.5296,
          "tokens": 758235,
          "time": 200.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.3651,
          "tokens": 93752,
          "time": 91.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 1.0221,
          "tokens": 292186,
          "time": 149.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.6021,
          "tokens": 468028,
          "time": 162.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 3.007,
          "tokens": 904906,
          "time": 230.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.5994,
          "tokens": 168245,
          "time": 104.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 1.4335,
          "tokens": 418274,
          "time": 156.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 2.0516,
          "tokens": 600117,
          "time": 179.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 3.7309,
          "tokens": 1118956,
          "time": 283.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 2.1124,
          "tokens": 632362,
          "time": 192.6
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 1.6132,
          "tokens": 475753,
          "time": 165.7
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 1.7808,
          "tokens": 521588,
          "time": 170.3
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 1.3149,
          "tokens": 374295,
          "time": 150.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 3.0056,
          "tokens": 911945,
          "time": 223.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 2.3451,
          "tokens": 717038,
          "time": 154.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.9412,
          "tokens": 583327,
          "time": 176.1
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 1.8588,
          "tokens": 544916,
          "time": 172.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.962,
          "tokens": 592574,
          "time": 172.4
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 2.233,
          "tokens": 677887,
          "time": 171.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.3173,
          "tokens": 354808,
          "time": 202.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.5455,
          "tokens": 436807,
          "time": 193.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": true,
          "cost": 1.2534,
          "tokens": 369292,
          "time": 137.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 2.0045,
          "tokens": 583999,
          "time": 234.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 2.6558,
          "tokens": 786655,
          "time": 237.3
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 1.0722,
          "tokens": 308011,
          "time": 136.0
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.7888,
          "tokens": 223466,
          "time": 115.9
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.5858,
          "tokens": 167812,
          "time": 90.3
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.5346,
          "tokens": 148874,
          "time": 98.9
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 1.116,
          "tokens": 321208,
          "time": 131.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 4.1534,
          "tokens": 1230160,
          "time": 303.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 1.1877,
          "tokens": 347733,
          "time": 130.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.9559,
          "tokens": 259744,
          "time": 128.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.4901,
          "tokens": 129254,
          "time": 97.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 1.4271,
          "tokens": 428993,
          "time": 141.0
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.7562,
          "tokens": 215761,
          "time": 113.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 1.7305,
          "tokens": 495941,
          "time": 202.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.6709,
          "tokens": 175175,
          "time": 125.0
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 1.1493,
          "tokens": 333462,
          "time": 120.3
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 1.8843,
          "tokens": 568402,
          "time": 135.6
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.1759,
          "tokens": 321092,
          "time": 170.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.8901,
          "tokens": 242361,
          "time": 139.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.9529,
          "tokens": 263457,
          "time": 133.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 3.598,
          "tokens": 1078610,
          "time": 260.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.7674,
          "tokens": 208015,
          "time": 129.3
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 1.572,
          "tokens": 455350,
          "time": 162.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.7348,
          "tokens": 207656,
          "time": 109.7
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.7478,
          "tokens": 210221,
          "time": 107.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 1.389,
          "tokens": 399170,
          "time": 165.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 1.3132,
          "tokens": 361212,
          "time": 179.1
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 2.183,
          "tokens": 629200,
          "time": 199.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 1.5684,
          "tokens": 463408,
          "time": 167.4
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.4466,
          "tokens": 121246,
          "time": 99.1
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 1.9247,
          "tokens": 565631,
          "time": 161.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.7393,
          "tokens": 199353,
          "time": 132.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 1.2882,
          "tokens": 376450,
          "time": 141.0
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.1263,
          "tokens": 314307,
          "time": 145.7
        }
      ]
    },
    {
      "runKey": "openclaw-deepseek-v4-pro",
      "harness": "openclaw",
      "model": "deepseek-v4-pro",
      "modelName": "deepseek-v4-pro",
      "reported": {
        "cost": 0.148,
        "tokens": 328000,
        "time": 317,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.0676,
          "tokens": 149538,
          "time": 168.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.0188,
          "tokens": 42563,
          "time": 210.3
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.1777,
          "tokens": 398390,
          "time": 281.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.1097,
          "tokens": 238908,
          "time": 366.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.0685,
          "tokens": 151430,
          "time": 358.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.1771,
          "tokens": 392571,
          "time": 349.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 0.2036,
          "tokens": 454835,
          "time": 362.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.1927,
          "tokens": 428964,
          "time": 469.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.1665,
          "tokens": 368072,
          "time": 335.6
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.114,
          "tokens": 255736,
          "time": 317.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.0174,
          "tokens": 39544,
          "time": 212.6
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.0259,
          "tokens": 59099,
          "time": 184.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 0.1556,
          "tokens": 348982,
          "time": 280.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.1522,
          "tokens": 343910,
          "time": 266.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": true,
          "cost": 0.1911,
          "tokens": 429673,
          "time": 372.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.1863,
          "tokens": 415763,
          "time": 315.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.0613,
          "tokens": 138626,
          "time": 138.1
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.1236,
          "tokens": 275721,
          "time": 258.2
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.2255,
          "tokens": 504898,
          "time": 369.0
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": true,
          "cost": 0.4623,
          "tokens": 1040609,
          "time": 749.7
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.2068,
          "tokens": 464417,
          "time": 325.9
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.1043,
          "tokens": 226074,
          "time": 331.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.2681,
          "tokens": 598375,
          "time": 534.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.101,
          "tokens": 225209,
          "time": 202.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.0834,
          "tokens": 187107,
          "time": 199.8
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.1811,
          "tokens": 406519,
          "time": 303.4
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.1853,
          "tokens": 412898,
          "time": 397.2
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.1984,
          "tokens": 441845,
          "time": 412.8
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.2416,
          "tokens": 544493,
          "time": 325.2
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.2012,
          "tokens": 457835,
          "time": 222.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.1102,
          "tokens": 246063,
          "time": 234.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 0.1623,
          "tokens": 357016,
          "time": 387.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 0.1545,
          "tokens": 339662,
          "time": 380.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 0.1782,
          "tokens": 394026,
          "time": 390.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.2389,
          "tokens": 529510,
          "time": 456.5
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.0287,
          "tokens": 64544,
          "time": 146.1
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.2698,
          "tokens": 599035,
          "time": 485.2
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.0509,
          "tokens": 114801,
          "time": 154.6
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.2211,
          "tokens": 491600,
          "time": 418.0
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.2461,
          "tokens": 552449,
          "time": 347.3
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.1784,
          "tokens": 394262,
          "time": 391.8
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.174,
          "tokens": 391280,
          "time": 284.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.1149,
          "tokens": 253894,
          "time": 287.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.152,
          "tokens": 339844,
          "time": 329.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.0431,
          "tokens": 96951,
          "time": 141.1
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": true,
          "cost": 0.1486,
          "tokens": 328308,
          "time": 462.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.0689,
          "tokens": 151694,
          "time": 184.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.1111,
          "tokens": 245500,
          "time": 240.3
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.1053,
          "tokens": 234742,
          "time": 245.8
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.1453,
          "tokens": 324181,
          "time": 478.8
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 0.1958,
          "tokens": 436964,
          "time": 354.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.1588,
          "tokens": 351818,
          "time": 320.5
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.1247,
          "tokens": 274010,
          "time": 331.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 0.2302,
          "tokens": 506884,
          "time": 555.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.0916,
          "tokens": 199555,
          "time": 291.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.0172,
          "tokens": 39096,
          "time": 58.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.1104,
          "tokens": 247317,
          "time": 196.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.1979,
          "tokens": 442153,
          "time": 488.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.1631,
          "tokens": 361888,
          "time": 355.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": false,
          "cost": 0.0888,
          "tokens": 192851,
          "time": 294.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.1046,
          "tokens": 234351,
          "time": 202.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.1354,
          "tokens": 302441,
          "time": 265.2
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.125,
          "tokens": 274953,
          "time": 389.0
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.1759,
          "tokens": 386237,
          "time": 392.9
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.1105,
          "tokens": 240214,
          "time": 323.2
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.0542,
          "tokens": 121331,
          "time": 156.6
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.1053,
          "tokens": 232276,
          "time": 305.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.0992,
          "tokens": 218816,
          "time": 307.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.1525,
          "tokens": 339604,
          "time": 279.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.1402,
          "tokens": 314275,
          "time": 236.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 0.3309,
          "tokens": 729174,
          "time": 661.7
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.1465,
          "tokens": 329865,
          "time": 247.7
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.1966,
          "tokens": 438429,
          "time": 404.2
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.2816,
          "tokens": 630858,
          "time": 458.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.075,
          "tokens": 164358,
          "time": 219.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.2311,
          "tokens": 516537,
          "time": 398.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.1998,
          "tokens": 443413,
          "time": 529.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.1369,
          "tokens": 301818,
          "time": 351.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.1384,
          "tokens": 312684,
          "time": 251.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.1491,
          "tokens": 333307,
          "time": 326.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.2345,
          "tokens": 518966,
          "time": 458.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.0616,
          "tokens": 133330,
          "time": 225.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.1375,
          "tokens": 303483,
          "time": 302.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.1799,
          "tokens": 401109,
          "time": 360.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 0.1469,
          "tokens": 324872,
          "time": 339.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.1189,
          "tokens": 258843,
          "time": 334.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.1921,
          "tokens": 428602,
          "time": 342.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.2079,
          "tokens": 461652,
          "time": 471.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 0.1132,
          "tokens": 250899,
          "time": 253.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.126,
          "tokens": 278907,
          "time": 299.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.2061,
          "tokens": 459835,
          "time": 361.5
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.1081,
          "tokens": 238758,
          "time": 257.2
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.159,
          "tokens": 349211,
          "time": 417.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.1327,
          "tokens": 295090,
          "time": 262.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 0.2196,
          "tokens": 492133,
          "time": 407.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 0.1912,
          "tokens": 425809,
          "time": 371.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.017,
          "tokens": 38921,
          "time": 68.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.3035,
          "tokens": 678225,
          "time": 396.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.4226,
          "tokens": 943655,
          "time": 652.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.4186,
          "tokens": 938213,
          "time": 631.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.2527,
          "tokens": 556833,
          "time": 525.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.1126,
          "tokens": 252552,
          "time": 249.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.2465,
          "tokens": 552273,
          "time": 350.1
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.1487,
          "tokens": 330693,
          "time": 330.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.1874,
          "tokens": 415614,
          "time": 382.7
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.0586,
          "tokens": 130178,
          "time": 140.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.3193,
          "tokens": 710541,
          "time": 560.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.2476,
          "tokens": 547823,
          "time": 447.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.3275,
          "tokens": 729689,
          "time": 576.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.0787,
          "tokens": 176790,
          "time": 199.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.1845,
          "tokens": 407125,
          "time": 465.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.2041,
          "tokens": 452228,
          "time": 493.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": false,
          "cost": 0.0628,
          "tokens": 140087,
          "time": 154.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": false,
          "cost": 0.1703,
          "tokens": 377688,
          "time": 347.3
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.0919,
          "tokens": 204989,
          "time": 187.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.2325,
          "tokens": 519008,
          "time": 384.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 0.2823,
          "tokens": 632039,
          "time": 397.4
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.122,
          "tokens": 272156,
          "time": 288.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.1091,
          "tokens": 239993,
          "time": 332.1
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.1981,
          "tokens": 444987,
          "time": 318.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.1037,
          "tokens": 229167,
          "time": 255.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.0254,
          "tokens": 57792,
          "time": 69.8
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": false,
          "cost": 0.0638,
          "tokens": 144824,
          "time": 104.0
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": false,
          "cost": 0.0417,
          "tokens": 92859,
          "time": 93.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": true,
          "cost": 0.1728,
          "tokens": 380162,
          "time": 520.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.1898,
          "tokens": 419708,
          "time": 388.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.0315,
          "tokens": 70804,
          "time": 82.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.1354,
          "tokens": 300887,
          "time": 408.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.0254,
          "tokens": 57870,
          "time": 71.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.2573,
          "tokens": 581964,
          "time": 330.0
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.1279,
          "tokens": 288050,
          "time": 229.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.1899,
          "tokens": 422321,
          "time": 358.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.1325,
          "tokens": 293035,
          "time": 309.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.1585,
          "tokens": 354074,
          "time": 285.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 0.1849,
          "tokens": 411964,
          "time": 294.8
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.0453,
          "tokens": 101196,
          "time": 114.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.1581,
          "tokens": 351424,
          "time": 359.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.0344,
          "tokens": 72352,
          "time": 185.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 0.0912,
          "tokens": 203904,
          "time": 157.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.1023,
          "tokens": 231660,
          "time": 168.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": false,
          "cost": 0.0982,
          "tokens": 222475,
          "time": 140.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.1224,
          "tokens": 276263,
          "time": 182.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.1391,
          "tokens": 309181,
          "time": 293.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.1572,
          "tokens": 350692,
          "time": 413.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.2274,
          "tokens": 510071,
          "time": 349.7
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.2368,
          "tokens": 527613,
          "time": 456.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.1126,
          "tokens": 255501,
          "time": 149.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.1795,
          "tokens": 401668,
          "time": 317.3
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.1397,
          "tokens": 310712,
          "time": 350.6
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.1278,
          "tokens": 282056,
          "time": 320.1
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.2261,
          "tokens": 504705,
          "time": 408.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.0377,
          "tokens": 85499,
          "time": 83.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.0948,
          "tokens": 208101,
          "time": 261.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.0534,
          "tokens": 120500,
          "time": 148.9
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.0171,
          "tokens": 39042,
          "time": 56.0
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.0903,
          "tokens": 204819,
          "time": 181.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.1557,
          "tokens": 344608,
          "time": 313.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.1694,
          "tokens": 375193,
          "time": 384.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.2125,
          "tokens": 474189,
          "time": 421.2
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": true,
          "cost": 0.153,
          "tokens": 337228,
          "time": 361.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.1259,
          "tokens": 280811,
          "time": 267.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 0.1541,
          "tokens": 337990,
          "time": 370.3
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.1176,
          "tokens": 261624,
          "time": 227.7
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.0508,
          "tokens": 114550,
          "time": 104.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.135,
          "tokens": 297821,
          "time": 388.1
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.1628,
          "tokens": 352109,
          "time": 480.8
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.1156,
          "tokens": 249796,
          "time": 336.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.1135,
          "tokens": 246172,
          "time": 359.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.092,
          "tokens": 202782,
          "time": 208.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.1266,
          "tokens": 278028,
          "time": 295.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1379,
          "tokens": 305048,
          "time": 307.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.0941,
          "tokens": 211925,
          "time": 154.7
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 0.1453,
          "tokens": 319582,
          "time": 366.5
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.0437,
          "tokens": 98813,
          "time": 90.2
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.0504,
          "tokens": 113803,
          "time": 105.7
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.1074,
          "tokens": 239174,
          "time": 235.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.0958,
          "tokens": 209155,
          "time": 251.2
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.1162,
          "tokens": 253090,
          "time": 314.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.0619,
          "tokens": 136244,
          "time": 229.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.0475,
          "tokens": 98170,
          "time": 140.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.3025,
          "tokens": 668406,
          "time": 739.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.1179,
          "tokens": 260599,
          "time": 310.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.2737,
          "tokens": 618537,
          "time": 335.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.1636,
          "tokens": 364406,
          "time": 317.7
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.0853,
          "tokens": 187972,
          "time": 281.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.1959,
          "tokens": 426635,
          "time": 628.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.1493,
          "tokens": 331110,
          "time": 389.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.1717,
          "tokens": 379993,
          "time": 368.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.175,
          "tokens": 385819,
          "time": 403.7
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.1061,
          "tokens": 235270,
          "time": 239.5
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": true,
          "cost": 0.0919,
          "tokens": 201248,
          "time": 258.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.1161,
          "tokens": 254773,
          "time": 291.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.0859,
          "tokens": 187416,
          "time": 263.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.0967,
          "tokens": 218467,
          "time": 245.7
        }
      ]
    },
    {
      "runKey": "openclaw-haiku-4.5",
      "harness": "openclaw",
      "model": "claude-haiku-4.5",
      "modelName": "claude-haiku-4.5",
      "reported": {
        "cost": 1.022,
        "tokens": 932000,
        "time": 155,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": true,
          "cost": 1.6169,
          "tokens": 1508461,
          "time": 235.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.6938,
          "tokens": 627068,
          "time": 146.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 1.811,
          "tokens": 1710586,
          "time": 210.4
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.5865,
          "tokens": 1472081,
          "time": 211.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.7404,
          "tokens": 666941,
          "time": 159.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 1.1658,
          "tokens": 1030465,
          "time": 261.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 1.2327,
          "tokens": 1144847,
          "time": 174.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.6623,
          "tokens": 1501753,
          "time": 294.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.6237,
          "tokens": 550822,
          "time": 137.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.6736,
          "tokens": 608964,
          "time": 110.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.862,
          "tokens": 795621,
          "time": 148.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.808,
          "tokens": 720698,
          "time": 150.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 0.457,
          "tokens": 403960,
          "time": 116.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.7653,
          "tokens": 698396,
          "time": 136.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.7657,
          "tokens": 694740,
          "time": 137.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": true,
          "cost": 0.5637,
          "tokens": 513728,
          "time": 116.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 1.4059,
          "tokens": 1297267,
          "time": 212.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 1.0032,
          "tokens": 902986,
          "time": 170.6
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 1.2651,
          "tokens": 1170193,
          "time": 169.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 1.4135,
          "tokens": 1312713,
          "time": 191.3
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 1.7488,
          "tokens": 1637327,
          "time": 186.9
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.6411,
          "tokens": 572069,
          "time": 146.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.9683,
          "tokens": 883112,
          "time": 180.0
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.847,
          "tokens": 767207,
          "time": 137.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 1.6981,
          "tokens": 1542344,
          "time": 259.5
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.5837,
          "tokens": 1474036,
          "time": 177.3
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.4205,
          "tokens": 361348,
          "time": 112.8
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.7167,
          "tokens": 1587305,
          "time": 228.8
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.7838,
          "tokens": 713128,
          "time": 146.5
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.6971,
          "tokens": 638664,
          "time": 118.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.9859,
          "tokens": 905641,
          "time": 149.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 1.1946,
          "tokens": 1093446,
          "time": 184.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 1.4065,
          "tokens": 1274994,
          "time": 220.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 1.7036,
          "tokens": 1572916,
          "time": 216.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.6307,
          "tokens": 1517124,
          "time": 214.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.6678,
          "tokens": 595287,
          "time": 134.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.3476,
          "tokens": 1254257,
          "time": 162.1
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.2681,
          "tokens": 234489,
          "time": 87.6
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.6691,
          "tokens": 593483,
          "time": 140.8
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.6898,
          "tokens": 627802,
          "time": 117.9
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 1.0468,
          "tokens": 952755,
          "time": 154.8
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.5017,
          "tokens": 447636,
          "time": 105.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.6926,
          "tokens": 609426,
          "time": 143.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.6172,
          "tokens": 545515,
          "time": 123.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.821,
          "tokens": 738607,
          "time": 134.4
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 1.2593,
          "tokens": 1162145,
          "time": 174.1
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.7726,
          "tokens": 674998,
          "time": 165.3
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.7035,
          "tokens": 629288,
          "time": 160.8
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.5503,
          "tokens": 495877,
          "time": 106.7
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 1.2542,
          "tokens": 1123481,
          "time": 221.9
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 1.1848,
          "tokens": 1075486,
          "time": 198.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.6159,
          "tokens": 564896,
          "time": 91.4
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.9994,
          "tokens": 898529,
          "time": 188.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.2613,
          "tokens": 1148547,
          "time": 209.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.4978,
          "tokens": 443858,
          "time": 115.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.4779,
          "tokens": 427082,
          "time": 96.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": false,
          "cost": 0.7177,
          "tokens": 641107,
          "time": 121.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.5861,
          "tokens": 488843,
          "time": 180.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 1.1145,
          "tokens": 1041476,
          "time": 145.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 1.1626,
          "tokens": 1069941,
          "time": 182.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.2863,
          "tokens": 235308,
          "time": 96.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.5358,
          "tokens": 1420442,
          "time": 173.7
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 1.4903,
          "tokens": 1350522,
          "time": 239.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.6784,
          "tokens": 592646,
          "time": 146.8
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 1.4488,
          "tokens": 1350745,
          "time": 155.6
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": false,
          "cost": 0.9277,
          "tokens": 827371,
          "time": 197.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 2.0222,
          "tokens": 1918661,
          "time": 193.1
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 1.0877,
          "tokens": 971373,
          "time": 197.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.7773,
          "tokens": 713340,
          "time": 118.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.6197,
          "tokens": 539012,
          "time": 131.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.4401,
          "tokens": 392070,
          "time": 108.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 1.7012,
          "tokens": 1565522,
          "time": 233.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 1.2899,
          "tokens": 1190740,
          "time": 152.3
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.3578,
          "tokens": 317685,
          "time": 96.6
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.9205,
          "tokens": 834430,
          "time": 153.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.7483,
          "tokens": 661503,
          "time": 146.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.9174,
          "tokens": 833676,
          "time": 157.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.6326,
          "tokens": 1484652,
          "time": 237.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.4476,
          "tokens": 393044,
          "time": 103.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.3172,
          "tokens": 280796,
          "time": 109.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.6476,
          "tokens": 571484,
          "time": 144.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.7638,
          "tokens": 703138,
          "time": 115.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.3856,
          "tokens": 344094,
          "time": 101.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.9493,
          "tokens": 868228,
          "time": 136.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.9723,
          "tokens": 888138,
          "time": 151.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.6045,
          "tokens": 1497863,
          "time": 182.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 1.4573,
          "tokens": 1340126,
          "time": 178.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.6161,
          "tokens": 547860,
          "time": 167.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.6922,
          "tokens": 610935,
          "time": 136.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 2.6633,
          "tokens": 2441538,
          "time": 312.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 1.0267,
          "tokens": 947240,
          "time": 160.3
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.0325,
          "tokens": 955097,
          "time": 139.3
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.3781,
          "tokens": 337202,
          "time": 98.8
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 1.2436,
          "tokens": 1124987,
          "time": 202.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.6849,
          "tokens": 616023,
          "time": 119.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.9871,
          "tokens": 911897,
          "time": 139.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.3938,
          "tokens": 348718,
          "time": 96.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 1.4212,
          "tokens": 1297629,
          "time": 187.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.5614,
          "tokens": 507273,
          "time": 107.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 2.9112,
          "tokens": 2690039,
          "time": 350.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 2.1266,
          "tokens": 1991281,
          "time": 305.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.2688,
          "tokens": 1154085,
          "time": 264.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 2.3747,
          "tokens": 2212223,
          "time": 306.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.4144,
          "tokens": 1332881,
          "time": 223.1
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 1.5495,
          "tokens": 1416482,
          "time": 291.8
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 1.6821,
          "tokens": 1571557,
          "time": 237.5
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.8033,
          "tokens": 738860,
          "time": 153.9
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.4821,
          "tokens": 426606,
          "time": 125.7
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 1.7606,
          "tokens": 1666243,
          "time": 222.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.1351,
          "tokens": 106885,
          "time": 83.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.9067,
          "tokens": 832063,
          "time": 137.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.6731,
          "tokens": 597728,
          "time": 120.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 2.0565,
          "tokens": 1911113,
          "time": 242.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 1.0611,
          "tokens": 980812,
          "time": 124.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.7451,
          "tokens": 676638,
          "time": 122.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.9038,
          "tokens": 830756,
          "time": 126.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 1.17,
          "tokens": 1075233,
          "time": 152.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 1.0151,
          "tokens": 918156,
          "time": 159.9
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 2.4877,
          "tokens": 2347311,
          "time": 306.9
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.3394,
          "tokens": 298854,
          "time": 83.9
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 1.8491,
          "tokens": 1659586,
          "time": 290.0
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 1.1848,
          "tokens": 1095233,
          "time": 154.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.4884,
          "tokens": 437594,
          "time": 98.0
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.4462,
          "tokens": 389981,
          "time": 99.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 1.1277,
          "tokens": 1023536,
          "time": 170.7
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.6681,
          "tokens": 579259,
          "time": 143.7
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 1.1805,
          "tokens": 1066084,
          "time": 228.0
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 0.6706,
          "tokens": 617369,
          "time": 124.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.2836,
          "tokens": 240919,
          "time": 95.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.4574,
          "tokens": 407783,
          "time": 102.5
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.7715,
          "tokens": 697216,
          "time": 139.2
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.4083,
          "tokens": 363775,
          "time": 100.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.9072,
          "tokens": 836772,
          "time": 144.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.676,
          "tokens": 613140,
          "time": 119.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.3788,
          "tokens": 324606,
          "time": 103.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": true,
          "cost": 0.5527,
          "tokens": 499096,
          "time": 107.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.7511,
          "tokens": 674476,
          "time": 138.5
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 1.7838,
          "tokens": 1622088,
          "time": 317.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 1.2654,
          "tokens": 1171461,
          "time": 198.6
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.624,
          "tokens": 562169,
          "time": 108.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.3048,
          "tokens": 258280,
          "time": 104.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 1.0386,
          "tokens": 952387,
          "time": 163.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.1465,
          "tokens": 1027323,
          "time": 212.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 1.0251,
          "tokens": 939543,
          "time": 192.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.8993,
          "tokens": 809616,
          "time": 197.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.4983,
          "tokens": 444448,
          "time": 126.3
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 1.1648,
          "tokens": 1018834,
          "time": 247.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.9416,
          "tokens": 876282,
          "time": 164.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.9476,
          "tokens": 869595,
          "time": 268.6
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 1.3577,
          "tokens": 1246852,
          "time": 223.0
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.5324,
          "tokens": 482856,
          "time": 119.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 3.0108,
          "tokens": 2827514,
          "time": 377.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 2.7395,
          "tokens": 2559159,
          "time": 392.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.4688,
          "tokens": 417091,
          "time": 176.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.897,
          "tokens": 821128,
          "time": 167.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.8056,
          "tokens": 740565,
          "time": 143.8
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.1489,
          "tokens": 1063217,
          "time": 185.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.4296,
          "tokens": 390932,
          "time": 108.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.8435,
          "tokens": 765572,
          "time": 163.8
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.7419,
          "tokens": 655277,
          "time": 160.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.7545,
          "tokens": 680677,
          "time": 122.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.4206,
          "tokens": 1292615,
          "time": 238.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 2.0197,
          "tokens": 1855861,
          "time": 324.0
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.595,
          "tokens": 527959,
          "time": 140.9
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.8899,
          "tokens": 813459,
          "time": 157.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.7216,
          "tokens": 631387,
          "time": 182.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.6038,
          "tokens": 519316,
          "time": 160.8
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 2.2595,
          "tokens": 2085713,
          "time": 305.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.1855,
          "tokens": 161803,
          "time": 83.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.6766,
          "tokens": 599278,
          "time": 170.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.5117,
          "tokens": 457503,
          "time": 120.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.2096,
          "tokens": 175787,
          "time": 79.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.7465,
          "tokens": 643808,
          "time": 198.1
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 1.1865,
          "tokens": 1089394,
          "time": 181.1
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.3342,
          "tokens": 286993,
          "time": 108.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 1.2126,
          "tokens": 1115178,
          "time": 192.5
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 0.8172,
          "tokens": 748961,
          "time": 142.6
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.3299,
          "tokens": 294884,
          "time": 86.0
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 2.0873,
          "tokens": 1928343,
          "time": 286.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.2103,
          "tokens": 169218,
          "time": 89.4
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 1.2518,
          "tokens": 1131876,
          "time": 217.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 1.7354,
          "tokens": 1588321,
          "time": 280.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.7831,
          "tokens": 709895,
          "time": 145.5
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.967,
          "tokens": 894055,
          "time": 162.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 1.6771,
          "tokens": 1506414,
          "time": 276.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": true,
          "cost": 1.1204,
          "tokens": 1019137,
          "time": 181.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": true,
          "cost": 0.5831,
          "tokens": 512241,
          "time": 162.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": true,
          "cost": 0.6853,
          "tokens": 624886,
          "time": 149.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 1.8677,
          "tokens": 1710382,
          "time": 260.1
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.8834,
          "tokens": 802513,
          "time": 158.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.7206,
          "tokens": 659354,
          "time": 128.9
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.71,
          "tokens": 645689,
          "time": 136.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.5582,
          "tokens": 493450,
          "time": 129.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 2.4612,
          "tokens": 2255957,
          "time": 331.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 2.4792,
          "tokens": 2281641,
          "time": 322.2
        }
      ]
    },
    {
      "runKey": "rlm-gpt-5",
      "harness": "trace-rlm",
      "model": "gpt-5",
      "modelName": "gpt-5",
      "reported": {
        "cost": 0.4,
        "tokens": 473000,
        "time": 374,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.121,
          "tokens": 72921,
          "time": 173.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": true,
          "cost": 0.4427,
          "tokens": 413244,
          "time": 391.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.573,
          "tokens": 530637,
          "time": 430.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.2636,
          "tokens": 173329,
          "time": 317.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.272,
          "tokens": 176669,
          "time": 305.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.3333,
          "tokens": 244141,
          "time": 302.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.2441,
          "tokens": 3846351,
          "time": 1232.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.3725,
          "tokens": 307021,
          "time": 311.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.3068,
          "tokens": 205779,
          "time": 328.5
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.2922,
          "tokens": 208853,
          "time": 282.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.2889,
          "tokens": 227599,
          "time": 311.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.456,
          "tokens": 354263,
          "time": 394.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.5518,
          "tokens": 560710,
          "time": 426.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.3406,
          "tokens": 277449,
          "time": 382.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.4147,
          "tokens": 370274,
          "time": 323.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.3222,
          "tokens": 292171,
          "time": 494.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.4701,
          "tokens": 385281,
          "time": 421.1
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.1018,
          "tokens": 46431,
          "time": 179.6
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.3783,
          "tokens": 387916,
          "time": 384.1
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.3583,
          "tokens": 242855,
          "time": 321.8
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.6181,
          "tokens": 769923,
          "time": 420.0
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.1475,
          "tokens": 77298,
          "time": 197.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.524,
          "tokens": 500903,
          "time": 364.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.3907,
          "tokens": 629890,
          "time": 716.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 0.8809,
          "tokens": 1666565,
          "time": 710.8
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.3235,
          "tokens": 267424,
          "time": 318.0
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.2231,
          "tokens": 152976,
          "time": 251.4
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.6511,
          "tokens": 2028983,
          "time": 526.9
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.5568,
          "tokens": 526579,
          "time": 516.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.4318,
          "tokens": 340273,
          "time": 402.2
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.2529,
          "tokens": 200306,
          "time": 318.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.7247,
          "tokens": 766795,
          "time": 468.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.1771,
          "tokens": 97103,
          "time": 214.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.859,
          "tokens": 782435,
          "time": 738.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": true,
          "cost": 0.9006,
          "tokens": 1263682,
          "time": 817.4
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.3778,
          "tokens": 317611,
          "time": 313.3
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.1964,
          "tokens": 86484,
          "time": 349.2
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.4767,
          "tokens": 373964,
          "time": 569.2
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.4318,
          "tokens": 317046,
          "time": 487.0
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.3326,
          "tokens": 243382,
          "time": 360.5
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.2834,
          "tokens": 198266,
          "time": 285.9
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.2761,
          "tokens": 330726,
          "time": 723.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.2764,
          "tokens": 180689,
          "time": 303.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 0.2869,
          "tokens": 422818,
          "time": 382.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.3876,
          "tokens": 281344,
          "time": 417.5
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.2699,
          "tokens": 160365,
          "time": 355.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.1942,
          "tokens": 120864,
          "time": 236.1
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.1365,
          "tokens": 86815,
          "time": 136.7
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.1603,
          "tokens": 99684,
          "time": 170.5
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.3136,
          "tokens": 256264,
          "time": 272.9
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 0.3786,
          "tokens": 359439,
          "time": 412.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.1389,
          "tokens": 140969,
          "time": 184.7
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.2543,
          "tokens": 281568,
          "time": 631.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.0954,
          "tokens": 3066248,
          "time": 879.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.6261,
          "tokens": 671262,
          "time": 529.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.2649,
          "tokens": 165161,
          "time": 295.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.2531,
          "tokens": 187820,
          "time": 257.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.3511,
          "tokens": 231528,
          "time": 233.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.5453,
          "tokens": 554974,
          "time": 477.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.3517,
          "tokens": 304026,
          "time": 254.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.2424,
          "tokens": 158041,
          "time": 272.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.5745,
          "tokens": 659869,
          "time": 650.4
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.5319,
          "tokens": 575630,
          "time": 442.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.8072,
          "tokens": 1187568,
          "time": 685.0
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.4687,
          "tokens": 1332463,
          "time": 435.9
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.2902,
          "tokens": 207501,
          "time": 218.0
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.3469,
          "tokens": 345875,
          "time": 272.4
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.2021,
          "tokens": 265292,
          "time": 280.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.3254,
          "tokens": 231996,
          "time": 302.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.1444,
          "tokens": 82777,
          "time": 371.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.625,
          "tokens": 513343,
          "time": 427.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.6794,
          "tokens": 792388,
          "time": 584.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.1932,
          "tokens": 116257,
          "time": 249.9
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.1626,
          "tokens": 97359,
          "time": 153.7
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.4448,
          "tokens": 314704,
          "time": 366.2
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.2781,
          "tokens": 158605,
          "time": 387.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.4664,
          "tokens": 359964,
          "time": 325.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.3459,
          "tokens": 266192,
          "time": 323.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.2968,
          "tokens": 209490,
          "time": 358.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.6812,
          "tokens": 1905266,
          "time": 593.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.4615,
          "tokens": 364209,
          "time": 316.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.5696,
          "tokens": 529988,
          "time": 400.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.2674,
          "tokens": 175334,
          "time": 212.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.1854,
          "tokens": 121604,
          "time": 206.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.368,
          "tokens": 262180,
          "time": 286.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.3266,
          "tokens": 234635,
          "time": 338.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.8063,
          "tokens": 979628,
          "time": 563.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.5893,
          "tokens": 469843,
          "time": 428.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.4556,
          "tokens": 333974,
          "time": 403.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.4152,
          "tokens": 571298,
          "time": 282.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.1508,
          "tokens": 97463,
          "time": 289.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.1463,
          "tokens": 96595,
          "time": 108.9
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.1261,
          "tokens": 81271,
          "time": 182.6
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.0911,
          "tokens": 52322,
          "time": 144.8
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.2725,
          "tokens": 226784,
          "time": 230.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.5233,
          "tokens": 465675,
          "time": 318.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.6252,
          "tokens": 544251,
          "time": 327.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.5324,
          "tokens": 425109,
          "time": 329.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.4829,
          "tokens": 526194,
          "time": 408.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.6508,
          "tokens": 695719,
          "time": 412.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.2701,
          "tokens": 728992,
          "time": 467.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.7677,
          "tokens": 2463872,
          "time": 762.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.2566,
          "tokens": 197549,
          "time": 318.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.526,
          "tokens": 884760,
          "time": 1575.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.6637,
          "tokens": 776343,
          "time": 453.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.2238,
          "tokens": 152572,
          "time": 242.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 0.515,
          "tokens": 647531,
          "time": 422.2
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 0.7332,
          "tokens": 1029405,
          "time": 525.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.2161,
          "tokens": 169037,
          "time": 253.9
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.9042,
          "tokens": 1486419,
          "time": 619.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.4272,
          "tokens": 361476,
          "time": 269.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.3738,
          "tokens": 330003,
          "time": 471.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.5388,
          "tokens": 623951,
          "time": 551.3
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.343,
          "tokens": 291705,
          "time": 249.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.2452,
          "tokens": 172647,
          "time": 235.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.3067,
          "tokens": 257515,
          "time": 256.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.6912,
          "tokens": 1779468,
          "time": 584.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 0.8527,
          "tokens": 842695,
          "time": 435.3
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.5213,
          "tokens": 462826,
          "time": 369.8
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.2768,
          "tokens": 214133,
          "time": 300.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.2797,
          "tokens": 197931,
          "time": 307.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.3627,
          "tokens": 314929,
          "time": 275.1
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.4245,
          "tokens": 306047,
          "time": 285.0
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.2818,
          "tokens": 174295,
          "time": 214.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.2004,
          "tokens": 147052,
          "time": 206.6
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.393,
          "tokens": 773712,
          "time": 351.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 0.4205,
          "tokens": 313217,
          "time": 373.5
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 2.3546,
          "tokens": 8116063,
          "time": 791.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.1444,
          "tokens": 65495,
          "time": 165.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.2203,
          "tokens": 172871,
          "time": 230.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.7796,
          "tokens": 1703497,
          "time": 997.9
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.1823,
          "tokens": 127186,
          "time": 226.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.3122,
          "tokens": 254700,
          "time": 287.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.2517,
          "tokens": 174599,
          "time": 278.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": true,
          "cost": 0.198,
          "tokens": 243159,
          "time": 392.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.5477,
          "tokens": 472295,
          "time": 407.1
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.5383,
          "tokens": 399234,
          "time": 455.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.2349,
          "tokens": 151352,
          "time": 260.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.3184,
          "tokens": 288471,
          "time": 251.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 0.3084,
          "tokens": 222139,
          "time": 282.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.4146,
          "tokens": 290848,
          "time": 400.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.5148,
          "tokens": 402601,
          "time": 348.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.4873,
          "tokens": 506069,
          "time": 474.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 0.3907,
          "tokens": 429433,
          "time": 248.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.3786,
          "tokens": 448711,
          "time": 399.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.4904,
          "tokens": 471481,
          "time": 259.7
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.1541,
          "tokens": 99499,
          "time": 224.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.1463,
          "tokens": 87487,
          "time": 176.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.2467,
          "tokens": 139576,
          "time": 257.8
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.467,
          "tokens": 351199,
          "time": 485.8
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.7349,
          "tokens": 963073,
          "time": 509.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.3379,
          "tokens": 275770,
          "time": 302.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.6617,
          "tokens": 774597,
          "time": 561.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.2136,
          "tokens": 151122,
          "time": 281.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.8601,
          "tokens": 930581,
          "time": 519.2
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.185,
          "tokens": 117410,
          "time": 209.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": true,
          "cost": 0.4302,
          "tokens": 481239,
          "time": 403.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.38,
          "tokens": 338429,
          "time": 274.3
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.3186,
          "tokens": 256317,
          "time": 409.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.2682,
          "tokens": 200007,
          "time": 262.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.4867,
          "tokens": 435001,
          "time": 411.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.4185,
          "tokens": 449080,
          "time": 409.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.6346,
          "tokens": 880495,
          "time": 595.8
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.3975,
          "tokens": 326758,
          "time": 312.7
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.3352,
          "tokens": 264304,
          "time": 269.8
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.1609,
          "tokens": 126159,
          "time": 137.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.1439,
          "tokens": 71573,
          "time": 234.0
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.1727,
          "tokens": 127156,
          "time": 197.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.4755,
          "tokens": 356333,
          "time": 506.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.1893,
          "tokens": 156892,
          "time": 266.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.254,
          "tokens": 145871,
          "time": 243.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1819,
          "tokens": 115485,
          "time": 249.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.3532,
          "tokens": 216267,
          "time": 450.7
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.3815,
          "tokens": 352485,
          "time": 352.7
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.3879,
          "tokens": 479465,
          "time": 459.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.2053,
          "tokens": 125810,
          "time": 222.7
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.1402,
          "tokens": 104820,
          "time": 181.9
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.3053,
          "tokens": 276548,
          "time": 296.3
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.2799,
          "tokens": 265147,
          "time": 265.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.3591,
          "tokens": 234567,
          "time": 377.8
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.5621,
          "tokens": 509897,
          "time": 492.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.4483,
          "tokens": 344964,
          "time": 483.7
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.2163,
          "tokens": 154017,
          "time": 225.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": true,
          "cost": 0.2068,
          "tokens": 148123,
          "time": 268.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.131,
          "tokens": 69476,
          "time": 193.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.1265,
          "tokens": 80161,
          "time": 172.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.1616,
          "tokens": 202086,
          "time": 222.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.1082,
          "tokens": 62139,
          "time": 146.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.4128,
          "tokens": 400966,
          "time": 338.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.6535,
          "tokens": 999863,
          "time": 746.9
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.379,
          "tokens": 295134,
          "time": 338.2
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.4101,
          "tokens": 327846,
          "time": 444.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.2652,
          "tokens": 275173,
          "time": 327.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.4479,
          "tokens": 409755,
          "time": 359.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": true,
          "cost": 0.3104,
          "tokens": 353553,
          "time": 372.1
        }
      ]
    },
    {
      "runKey": "rlm-sonnet-4.6",
      "harness": "trace-rlm",
      "model": "claude-sonnet-4.6",
      "modelName": "claude-sonnet-4.6",
      "reported": {
        "cost": 0.954,
        "tokens": 1100000,
        "time": 353,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": true,
          "cost": 0.2753,
          "tokens": 400424,
          "time": 204.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": true,
          "cost": 0.1942,
          "tokens": 252036,
          "time": 157.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 0.3593,
          "tokens": 559474,
          "time": 221.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.1928,
          "tokens": 218050,
          "time": 207.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.3425,
          "tokens": 496478,
          "time": 253.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 1.1748,
          "tokens": 707995,
          "time": 294.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.7882,
          "tokens": 2466053,
          "time": 485.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.1813,
          "tokens": 196744,
          "time": 146.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.8889,
          "tokens": 1279375,
          "time": 390.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.1764,
          "tokens": 222480,
          "time": 184.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 3.0086,
          "tokens": 2708974,
          "time": 667.6
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.9855,
          "tokens": 2156546,
          "time": 661.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 2.328,
          "tokens": 3005930,
          "time": 684.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": true,
          "cost": 0.865,
          "tokens": 1233458,
          "time": 348.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.6701,
          "tokens": 1034463,
          "time": 250.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.4813,
          "tokens": 797945,
          "time": 251.8
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.6627,
          "tokens": 1119205,
          "time": 583.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.218,
          "tokens": 295502,
          "time": 566.5
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 4.5761,
          "tokens": 3839961,
          "time": 1060.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.8553,
          "tokens": 1336513,
          "time": 576.1
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.549,
          "tokens": 970437,
          "time": 407.7
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.2014,
          "tokens": 244057,
          "time": 302.9
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": true,
          "cost": 1.0668,
          "tokens": 2057251,
          "time": 630.9
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.7582,
          "tokens": 1017209,
          "time": 598.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 1.7654,
          "tokens": 3521409,
          "time": 1039.9
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.889,
          "tokens": 1539313,
          "time": 570.6
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.2698,
          "tokens": 347535,
          "time": 406.8
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.8932,
          "tokens": 1525258,
          "time": 719.1
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.6688,
          "tokens": 1176639,
          "time": 581.7
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 10.7779,
          "tokens": 5757427,
          "time": 1104.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.3321,
          "tokens": 386039,
          "time": 576.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 5.0687,
          "tokens": 10530161,
          "time": 1761.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 1.1414,
          "tokens": 1151280,
          "time": 584.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 1.2031,
          "tokens": 2389718,
          "time": 833.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.0745,
          "tokens": 1881842,
          "time": 815.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.6617,
          "tokens": 1131827,
          "time": 718.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.7011,
          "tokens": 1269580,
          "time": 830.1
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 2.1595,
          "tokens": 2237946,
          "time": 944.9
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": true,
          "cost": 0.7323,
          "tokens": 930897,
          "time": 782.0
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 1.2955,
          "tokens": 2184547,
          "time": 1053.5
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 3.9261,
          "tokens": 3502230,
          "time": 899.7
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.3404,
          "tokens": 476781,
          "time": 571.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.4132,
          "tokens": 341299,
          "time": 518.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 4.29,
          "tokens": 2728857,
          "time": 791.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 2.7167,
          "tokens": 2499892,
          "time": 787.2
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.1705,
          "tokens": 187983,
          "time": 194.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.4093,
          "tokens": 601117,
          "time": 335.1
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.3069,
          "tokens": 311230,
          "time": 209.3
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.1532,
          "tokens": 182910,
          "time": 161.2
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.335,
          "tokens": 434985,
          "time": 319.5
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.7966,
          "tokens": 1426222,
          "time": 473.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.3155,
          "tokens": 426282,
          "time": 357.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 1.0703,
          "tokens": 1027825,
          "time": 379.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 0.9752,
          "tokens": 1667446,
          "time": 540.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 3.5164,
          "tokens": 2239356,
          "time": 567.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.2625,
          "tokens": 339163,
          "time": 299.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.2394,
          "tokens": 322168,
          "time": 248.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.1872,
          "tokens": 220774,
          "time": 224.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.431,
          "tokens": 650814,
          "time": 287.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.4774,
          "tokens": 797644,
          "time": 335.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.1376,
          "tokens": 134780,
          "time": 130.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.7288,
          "tokens": 1173674,
          "time": 337.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.3044,
          "tokens": 376068,
          "time": 365.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 1.2351,
          "tokens": 2282945,
          "time": 611.7
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.8194,
          "tokens": 1503683,
          "time": 498.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.1197,
          "tokens": 123762,
          "time": 141.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 1.1243,
          "tokens": 2189335,
          "time": 398.9
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 0.355,
          "tokens": 499032,
          "time": 267.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.6523,
          "tokens": 1012436,
          "time": 348.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.0945,
          "tokens": 99019,
          "time": 300.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.556,
          "tokens": 926484,
          "time": 330.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 0.8449,
          "tokens": 1522953,
          "time": 420.9
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.3115,
          "tokens": 391326,
          "time": 314.6
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.1533,
          "tokens": 131144,
          "time": 235.3
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.3727,
          "tokens": 633965,
          "time": 341.3
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.5703,
          "tokens": 863487,
          "time": 404.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 3.3784,
          "tokens": 1655698,
          "time": 328.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.8642,
          "tokens": 1576742,
          "time": 486.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 2.4186,
          "tokens": 1176381,
          "time": 421.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.1292,
          "tokens": 142746,
          "time": 254.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.0719,
          "tokens": 59643,
          "time": 250.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.5718,
          "tokens": 990985,
          "time": 374.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.1445,
          "tokens": 163641,
          "time": 269.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.142,
          "tokens": 122370,
          "time": 142.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.1799,
          "tokens": 196198,
          "time": 132.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.6944,
          "tokens": 1077806,
          "time": 248.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 3.6525,
          "tokens": 2334841,
          "time": 317.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": true,
          "cost": 0.5547,
          "tokens": 864316,
          "time": 186.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 1.474,
          "tokens": 2896815,
          "time": 380.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.9977,
          "tokens": 1896155,
          "time": 307.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.4445,
          "tokens": 660419,
          "time": 263.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.1227,
          "tokens": 121206,
          "time": 152.5
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.0552,
          "tokens": 46818,
          "time": 82.0
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.2885,
          "tokens": 393208,
          "time": 112.5
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 0.0898,
          "tokens": 75733,
          "time": 66.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.8625,
          "tokens": 1181606,
          "time": 209.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 0.3962,
          "tokens": 606892,
          "time": 167.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 1.3527,
          "tokens": 1033340,
          "time": 173.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.6335,
          "tokens": 1022591,
          "time": 196.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 2.3976,
          "tokens": 3791348,
          "time": 826.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 1.3833,
          "tokens": 2478653,
          "time": 761.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.3058,
          "tokens": 2657855,
          "time": 723.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.7227,
          "tokens": 480581,
          "time": 122.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 2.7735,
          "tokens": 4776037,
          "time": 840.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.5444,
          "tokens": 852653,
          "time": 372.2
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.3102,
          "tokens": 478973,
          "time": 179.2
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 3.1686,
          "tokens": 3022741,
          "time": 644.7
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 3.3082,
          "tokens": 7756287,
          "time": 926.0
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": false,
          "cost": 0.943,
          "tokens": 1402401,
          "time": 514.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.7261,
          "tokens": 1166075,
          "time": 606.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.2933,
          "tokens": 347166,
          "time": 117.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 2.4303,
          "tokens": 1137169,
          "time": 141.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.3735,
          "tokens": 580949,
          "time": 274.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.1871,
          "tokens": 203977,
          "time": 103.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.1663,
          "tokens": 190024,
          "time": 100.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.3978,
          "tokens": 606445,
          "time": 260.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 1.9446,
          "tokens": 2157631,
          "time": 602.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 1.1107,
          "tokens": 1808879,
          "time": 615.6
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.1308,
          "tokens": 129739,
          "time": 110.3
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.2099,
          "tokens": 269437,
          "time": 203.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.6077,
          "tokens": 1088125,
          "time": 528.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.4161,
          "tokens": 591749,
          "time": 470.4
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.3607,
          "tokens": 483425,
          "time": 457.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.4255,
          "tokens": 438567,
          "time": 211.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.1399,
          "tokens": 130822,
          "time": 162.5
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 2.5075,
          "tokens": 1320918,
          "time": 490.6
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.5949,
          "tokens": 726619,
          "time": 582.5
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 1.029,
          "tokens": 1148858,
          "time": 525.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 1.2024,
          "tokens": 547623,
          "time": 469.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.2614,
          "tokens": 381881,
          "time": 469.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.1353,
          "tokens": 123522,
          "time": 426.9
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.2823,
          "tokens": 398698,
          "time": 472.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.2197,
          "tokens": 282958,
          "time": 436.4
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.2794,
          "tokens": 377782,
          "time": 336.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.38,
          "tokens": 503389,
          "time": 359.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.6522,
          "tokens": 1113984,
          "time": 373.7
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 1.1531,
          "tokens": 1366021,
          "time": 446.0
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.4448,
          "tokens": 478884,
          "time": 364.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.3885,
          "tokens": 549979,
          "time": 182.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.3271,
          "tokens": 455386,
          "time": 164.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.6165,
          "tokens": 989191,
          "time": 233.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.2101,
          "tokens": 235888,
          "time": 161.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.3175,
          "tokens": 397506,
          "time": 135.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 2.6856,
          "tokens": 1714324,
          "time": 248.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.3718,
          "tokens": 539772,
          "time": 130.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.2676,
          "tokens": 326844,
          "time": 93.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.916,
          "tokens": 1516879,
          "time": 289.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.8539,
          "tokens": 607234,
          "time": 148.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.9278,
          "tokens": 1866681,
          "time": 253.1
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.7027,
          "tokens": 1108565,
          "time": 327.0
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 2.859,
          "tokens": 1933453,
          "time": 261.4
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 1.2126,
          "tokens": 1021933,
          "time": 198.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.5731,
          "tokens": 1010506,
          "time": 176.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.3525,
          "tokens": 483222,
          "time": 123.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.6073,
          "tokens": 1844936,
          "time": 271.9
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.2576,
          "tokens": 329309,
          "time": 126.4
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.509,
          "tokens": 1516237,
          "time": 225.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.3404,
          "tokens": 464619,
          "time": 155.9
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 2.1749,
          "tokens": 2104861,
          "time": 396.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.275,
          "tokens": 382046,
          "time": 136.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.4669,
          "tokens": 424681,
          "time": 164.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": true,
          "cost": 0.5395,
          "tokens": 885541,
          "time": 194.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 0.3918,
          "tokens": 588128,
          "time": 140.7
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.3172,
          "tokens": 462210,
          "time": 156.7
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.328,
          "tokens": 470643,
          "time": 156.0
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.1913,
          "tokens": 222100,
          "time": 99.3
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.1052,
          "tokens": 100946,
          "time": 55.5
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.1982,
          "tokens": 249039,
          "time": 96.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.988,
          "tokens": 1219888,
          "time": 256.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.0966,
          "tokens": 90970,
          "time": 52.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.0757,
          "tokens": 62651,
          "time": 51.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1135,
          "tokens": 105677,
          "time": 53.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.1915,
          "tokens": 226782,
          "time": 80.5
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 1.3982,
          "tokens": 937616,
          "time": 232.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 2.7164,
          "tokens": 1524748,
          "time": 159.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.0964,
          "tokens": 91367,
          "time": 55.9
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.6278,
          "tokens": 598808,
          "time": 132.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 0.7714,
          "tokens": 1274060,
          "time": 213.4
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.7806,
          "tokens": 991916,
          "time": 153.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.4853,
          "tokens": 749737,
          "time": 208.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.4995,
          "tokens": 929905,
          "time": 182.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.5259,
          "tokens": 958029,
          "time": 198.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.3049,
          "tokens": 437023,
          "time": 115.5
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.3571,
          "tokens": 536185,
          "time": 142.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.884,
          "tokens": 621297,
          "time": 126.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.2413,
          "tokens": 212025,
          "time": 106.7
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.4046,
          "tokens": 656332,
          "time": 135.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.2345,
          "tokens": 270487,
          "time": 96.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.3956,
          "tokens": 557647,
          "time": 125.0
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.4128,
          "tokens": 634946,
          "time": 146.5
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.0801,
          "tokens": 55817,
          "time": 61.7
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 1.0765,
          "tokens": 2431677,
          "time": 268.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": true,
          "cost": 0.6185,
          "tokens": 1111368,
          "time": 149.0
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.2825,
          "tokens": 364406,
          "time": 126.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 7.5483,
          "tokens": 3352863,
          "time": 266.1
        }
      ]
    },
    {
      "runKey": "codex-gpt-5-codex",
      "harness": "codex",
      "model": "gpt-5-codex",
      "modelName": "gpt-5-codex",
      "reported": {
        "cost": 0.342,
        "tokens": 1000000,
        "time": 350,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.2281,
          "tokens": 530209,
          "time": 115.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.2509,
          "tokens": 583713,
          "time": 178.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.5079,
          "tokens": 1437730,
          "time": 743.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.2355,
          "tokens": 639402,
          "time": 205.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.168,
          "tokens": 528291,
          "time": 101.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.2341,
          "tokens": 808461,
          "time": 137.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.2772,
          "tokens": 736928,
          "time": 159.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.0174,
          "tokens": 62663,
          "time": 30.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.2042,
          "tokens": 598484,
          "time": 191.3
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.1715,
          "tokens": 517303,
          "time": 225.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.4882,
          "tokens": 1435578,
          "time": 466.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.5607,
          "tokens": 1680125,
          "time": 287.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.0075,
          "tokens": 28648,
          "time": 12.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.4296,
          "tokens": 887247,
          "time": 214.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.3639,
          "tokens": 1035399,
          "time": 671.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.2274,
          "tokens": 561628,
          "time": 147.5
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.3313,
          "tokens": 880218,
          "time": 432.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.1606,
          "tokens": 528685,
          "time": 194.8
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": true,
          "cost": 0.166,
          "tokens": 500968,
          "time": 147.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.4747,
          "tokens": 1724613,
          "time": 1030.7
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.3106,
          "tokens": 872721,
          "time": 116.6
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.1808,
          "tokens": 480052,
          "time": 527.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.0462,
          "tokens": 154174,
          "time": 30.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.3214,
          "tokens": 752409,
          "time": 263.9
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 0.2935,
          "tokens": 914652,
          "time": 677.9
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.3743,
          "tokens": 1190041,
          "time": 770.2
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.2712,
          "tokens": 767561,
          "time": 367.9
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.3774,
          "tokens": 930114,
          "time": 244.1
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.6046,
          "tokens": 1719936,
          "time": 321.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.2132,
          "tokens": 889474,
          "time": 505.7
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.783,
          "tokens": 1775008,
          "time": 669.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 0.4369,
          "tokens": 1653295,
          "time": 465.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.5416,
          "tokens": 1493869,
          "time": 671.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.7918,
          "tokens": 2256421,
          "time": 525.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.286,
          "tokens": 4346515,
          "time": 417.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.2779,
          "tokens": 891200,
          "time": 209.4
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.2206,
          "tokens": 604686,
          "time": 219.0
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.559,
          "tokens": 1027369,
          "time": 488.5
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.4042,
          "tokens": 869354,
          "time": 224.0
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.2753,
          "tokens": 1022607,
          "time": 601.7
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.5814,
          "tokens": 2182873,
          "time": 1021.6
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.0109,
          "tokens": 43194,
          "time": 14.1
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.1441,
          "tokens": 287294,
          "time": 84.2
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 1.173,
          "tokens": 2730918,
          "time": 489.1
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.4259,
          "tokens": 1977535,
          "time": 1270.7
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.1517,
          "tokens": 512058,
          "time": 319.6
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.1126,
          "tokens": 397880,
          "time": 53.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.1824,
          "tokens": 561519,
          "time": 171.8
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.2855,
          "tokens": 961651,
          "time": 291.2
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.3935,
          "tokens": 1241910,
          "time": 208.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.5609,
          "tokens": 1264049,
          "time": 468.0
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.3184,
          "tokens": 919589,
          "time": 162.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.3767,
          "tokens": 1224748,
          "time": 632.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.041,
          "tokens": 168528,
          "time": 26.1
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.1625,
          "tokens": 528845,
          "time": 115.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.1958,
          "tokens": 627522,
          "time": 86.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.1924,
          "tokens": 456716,
          "time": 234.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.2177,
          "tokens": 680492,
          "time": 225.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.2029,
          "tokens": 672316,
          "time": 438.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.1539,
          "tokens": 517480,
          "time": 104.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.7241,
          "tokens": 2472120,
          "time": 605.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.6507,
          "tokens": 2281871,
          "time": 506.7
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.6798,
          "tokens": 2314302,
          "time": 589.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.6291,
          "tokens": 2008343,
          "time": 962.2
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.355,
          "tokens": 1042217,
          "time": 588.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.3344,
          "tokens": 1148143,
          "time": 1245.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.2716,
          "tokens": 709528,
          "time": 181.7
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 0.5099,
          "tokens": 1356041,
          "time": 852.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.2652,
          "tokens": 642284,
          "time": 503.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.0777,
          "tokens": 269695,
          "time": 81.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.1332,
          "tokens": 369520,
          "time": 184.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 1.5585,
          "tokens": 5122252,
          "time": 1078.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.2383,
          "tokens": 762664,
          "time": 372.2
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.3295,
          "tokens": 1076960,
          "time": 331.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 0.2418,
          "tokens": 554718,
          "time": 311.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.2837,
          "tokens": 838349,
          "time": 176.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.2912,
          "tokens": 750308,
          "time": 243.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": true,
          "cost": 0.6019,
          "tokens": 1450341,
          "time": 1118.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.2173,
          "tokens": 528076,
          "time": 174.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.1653,
          "tokens": 515450,
          "time": 652.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.2209,
          "tokens": 854275,
          "time": 1036.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.2258,
          "tokens": 636013,
          "time": 173.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": false,
          "cost": 0.0039,
          "tokens": 14211,
          "time": 11.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.5239,
          "tokens": 1431790,
          "time": 398.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.2332,
          "tokens": 829924,
          "time": 239.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 0.2812,
          "tokens": 804577,
          "time": 269.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.0558,
          "tokens": 144871,
          "time": 34.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.2388,
          "tokens": 516161,
          "time": 133.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.6258,
          "tokens": 1506697,
          "time": 788.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.6186,
          "tokens": 1405876,
          "time": 1240.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.0484,
          "tokens": 200212,
          "time": 31.3
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.3501,
          "tokens": 1493175,
          "time": 1167.9
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.1315,
          "tokens": 436079,
          "time": 143.0
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.1912,
          "tokens": 763790,
          "time": 289.0
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.1776,
          "tokens": 458408,
          "time": 409.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.5948,
          "tokens": 2036198,
          "time": 390.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.3745,
          "tokens": 1695452,
          "time": 358.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.3149,
          "tokens": 755838,
          "time": 227.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.1722,
          "tokens": 453355,
          "time": 196.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 1.8654,
          "tokens": 6006240,
          "time": 1042.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.2874,
          "tokens": 800226,
          "time": 411.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.8972,
          "tokens": 2568074,
          "time": 1079.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.302,
          "tokens": 1071567,
          "time": 418.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": true,
          "cost": 0.2485,
          "tokens": 839532,
          "time": 811.5
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": true,
          "cost": 0.4718,
          "tokens": 1094898,
          "time": 409.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.515,
          "tokens": 1445305,
          "time": 248.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.2924,
          "tokens": 980942,
          "time": 470.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 0.401,
          "tokens": 1007210,
          "time": 1079.4
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.6908,
          "tokens": 1433382,
          "time": 596.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.3735,
          "tokens": 1165513,
          "time": 701.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.1617,
          "tokens": 548995,
          "time": 215.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.4184,
          "tokens": 1468872,
          "time": 714.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.0327,
          "tokens": 103134,
          "time": 31.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.1679,
          "tokens": 459462,
          "time": 210.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": false,
          "cost": 0.0773,
          "tokens": 260352,
          "time": 114.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.162,
          "tokens": 439575,
          "time": 146.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.4955,
          "tokens": 1374782,
          "time": 1014.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 0.5166,
          "tokens": 1867073,
          "time": 333.4
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.2633,
          "tokens": 928153,
          "time": 141.4
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": false,
          "cost": 0.0245,
          "tokens": 92523,
          "time": 25.6
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.2743,
          "tokens": 897989,
          "time": 197.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.1656,
          "tokens": 506249,
          "time": 116.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.2164,
          "tokens": 639169,
          "time": 498.0
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.0781,
          "tokens": 189041,
          "time": 200.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.0864,
          "tokens": 253974,
          "time": 83.8
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.4923,
          "tokens": 1878039,
          "time": 227.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.4514,
          "tokens": 1010686,
          "time": 194.5
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.9286,
          "tokens": 2792118,
          "time": 908.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0175,
          "tokens": 64962,
          "time": 25.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.3527,
          "tokens": 1120018,
          "time": 407.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.2524,
          "tokens": 753183,
          "time": 160.8
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 0.8906,
          "tokens": 2668800,
          "time": 1122.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.2174,
          "tokens": 582152,
          "time": 126.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.3274,
          "tokens": 1146662,
          "time": 116.7
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.1964,
          "tokens": 500451,
          "time": 197.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.2401,
          "tokens": 778481,
          "time": 152.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.3561,
          "tokens": 1132259,
          "time": 170.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.1804,
          "tokens": 541358,
          "time": 306.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.3705,
          "tokens": 1306216,
          "time": 160.6
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.179,
          "tokens": 540437,
          "time": 126.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.0338,
          "tokens": 63414,
          "time": 29.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.1214,
          "tokens": 451316,
          "time": 134.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.2877,
          "tokens": 730074,
          "time": 263.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 0.526,
          "tokens": 1433705,
          "time": 293.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.1926,
          "tokens": 468757,
          "time": 99.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.5846,
          "tokens": 1362015,
          "time": 205.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.2956,
          "tokens": 614719,
          "time": 287.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.1182,
          "tokens": 365285,
          "time": 81.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 0.2353,
          "tokens": 600803,
          "time": 195.0
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.2996,
          "tokens": 766245,
          "time": 562.5
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.3409,
          "tokens": 1310684,
          "time": 254.9
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.2345,
          "tokens": 664218,
          "time": 175.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 1.1759,
          "tokens": 4118563,
          "time": 726.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.3313,
          "tokens": 1197416,
          "time": 1014.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.3952,
          "tokens": 1195878,
          "time": 306.8
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.4295,
          "tokens": 1170030,
          "time": 491.6
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": true,
          "cost": 0.3129,
          "tokens": 914749,
          "time": 389.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.1307,
          "tokens": 361229,
          "time": 217.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.3958,
          "tokens": 1239780,
          "time": 238.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.1517,
          "tokens": 560573,
          "time": 356.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.0085,
          "tokens": 14672,
          "time": 26.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.0203,
          "tokens": 2949754,
          "time": 375.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.5877,
          "tokens": 1674336,
          "time": 325.5
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.4707,
          "tokens": 1206163,
          "time": 277.3
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.3794,
          "tokens": 1084625,
          "time": 176.8
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.2002,
          "tokens": 667892,
          "time": 212.9
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.0863,
          "tokens": 326497,
          "time": 66.0
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 0.0159,
          "tokens": 62144,
          "time": 24.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.4668,
          "tokens": 1068851,
          "time": 248.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.1653,
          "tokens": 422020,
          "time": 87.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.2323,
          "tokens": 689139,
          "time": 196.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1958,
          "tokens": 726752,
          "time": 155.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.1457,
          "tokens": 427546,
          "time": 103.8
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 0.4133,
          "tokens": 1247960,
          "time": 994.8
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.2136,
          "tokens": 520262,
          "time": 157.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.1547,
          "tokens": 445245,
          "time": 116.4
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.3508,
          "tokens": 960927,
          "time": 184.1
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 0.0486,
          "tokens": 188249,
          "time": 24.6
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.3149,
          "tokens": 973678,
          "time": 266.7
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.407,
          "tokens": 1270849,
          "time": 198.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.2813,
          "tokens": 931382,
          "time": 216.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.1747,
          "tokens": 627864,
          "time": 103.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.4044,
          "tokens": 1487556,
          "time": 834.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.2271,
          "tokens": 705262,
          "time": 87.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.1372,
          "tokens": 470334,
          "time": 168.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.2757,
          "tokens": 1085583,
          "time": 218.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.2447,
          "tokens": 737449,
          "time": 123.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.3377,
          "tokens": 795491,
          "time": 132.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 0.2802,
          "tokens": 925278,
          "time": 245.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 1.8288,
          "tokens": 4965165,
          "time": 348.4
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.3867,
          "tokens": 960642,
          "time": 452.5
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": true,
          "cost": 0.4008,
          "tokens": 943953,
          "time": 139.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": true,
          "cost": 0.1532,
          "tokens": 404995,
          "time": 82.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.2453,
          "tokens": 537686,
          "time": 178.6
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.0061,
          "tokens": 28422,
          "time": 14.2
        }
      ]
    },
    {
      "runKey": "claudecode-opus-4.8",
      "harness": "claude-code",
      "model": "claude-opus-4.8",
      "modelName": "claude-opus-4.8",
      "reported": {
        "cost": 2.519,
        "tokens": 1000000,
        "time": 123,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 1.8014,
          "tokens": 719606,
          "time": 77.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 2.1658,
          "tokens": 870948,
          "time": 90.4
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 3.5399,
          "tokens": 1548113,
          "time": 151.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": true,
          "cost": 2.308,
          "tokens": 996996,
          "time": 105.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 3.3174,
          "tokens": 1426284,
          "time": 160.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 3.3855,
          "tokens": 1360836,
          "time": 158.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 2.6228,
          "tokens": 1036432,
          "time": 130.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.8029,
          "tokens": 688876,
          "time": 73.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 1.9637,
          "tokens": 787389,
          "time": 107.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 1.6172,
          "tokens": 731182,
          "time": 70.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 1.8172,
          "tokens": 748900,
          "time": 98.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 2.3412,
          "tokens": 822694,
          "time": 113.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": true,
          "cost": 3.5191,
          "tokens": 1449276,
          "time": 166.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 2.0222,
          "tokens": 850690,
          "time": 101.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": true,
          "cost": 3.6722,
          "tokens": 1484887,
          "time": 182.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 4.3822,
          "tokens": 1874131,
          "time": 191.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 3.8621,
          "tokens": 1589302,
          "time": 205.2
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 1.6514,
          "tokens": 654049,
          "time": 82.5
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 2.0573,
          "tokens": 887754,
          "time": 102.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 3.6145,
          "tokens": 1535526,
          "time": 167.5
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 2.8007,
          "tokens": 1104747,
          "time": 171.5
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 2.2551,
          "tokens": 902902,
          "time": 112.0
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 3.624,
          "tokens": 1464471,
          "time": 186.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 2.686,
          "tokens": 1125918,
          "time": 131.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 3.2308,
          "tokens": 1395544,
          "time": 159.5
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 4.692,
          "tokens": 1203770,
          "time": 172.9
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 2.1551,
          "tokens": 899480,
          "time": 94.9
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.9052,
          "tokens": 812721,
          "time": 116.1
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 2.6274,
          "tokens": 1030671,
          "time": 140.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 2.8752,
          "tokens": 1204966,
          "time": 125.4
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 3.1408,
          "tokens": 1200495,
          "time": 162.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 2.5569,
          "tokens": 966930,
          "time": 104.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 2.1438,
          "tokens": 909578,
          "time": 91.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 2.3963,
          "tokens": 987498,
          "time": 81.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 2.2219,
          "tokens": 915644,
          "time": 101.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 2.4712,
          "tokens": 897013,
          "time": 80.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 2.469,
          "tokens": 930435,
          "time": 123.6
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 2.7282,
          "tokens": 1150679,
          "time": 163.0
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 4.0715,
          "tokens": 1621399,
          "time": 205.8
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 2.5854,
          "tokens": 1038657,
          "time": 162.3
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 2.8204,
          "tokens": 1165043,
          "time": 138.0
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 2.3689,
          "tokens": 848742,
          "time": 119.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 2.526,
          "tokens": 914516,
          "time": 130.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 2.2319,
          "tokens": 1001398,
          "time": 107.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 2.0532,
          "tokens": 783116,
          "time": 120.1
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 3.4958,
          "tokens": 1284136,
          "time": 149.2
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 2.8785,
          "tokens": 1023626,
          "time": 114.8
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 1.3893,
          "tokens": 519290,
          "time": 66.3
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 1.5577,
          "tokens": 625426,
          "time": 75.9
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 3.1722,
          "tokens": 1120737,
          "time": 101.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 3.8826,
          "tokens": 1476553,
          "time": 168.1
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 4.3204,
          "tokens": 1872836,
          "time": 155.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 1.8919,
          "tokens": 763345,
          "time": 87.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 2.8562,
          "tokens": 920816,
          "time": 99.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 2.5108,
          "tokens": 1014071,
          "time": 133.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 2.0098,
          "tokens": 792711,
          "time": 109.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 1.216,
          "tokens": 509861,
          "time": 60.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 2.7292,
          "tokens": 1137406,
          "time": 112.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 2.3978,
          "tokens": 960386,
          "time": 104.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 1.6247,
          "tokens": 671758,
          "time": 65.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 2.4798,
          "tokens": 1003207,
          "time": 108.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 3.0118,
          "tokens": 1257031,
          "time": 140.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 1.5926,
          "tokens": 707324,
          "time": 104.4
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 4.0142,
          "tokens": 1027978,
          "time": 138.4
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 2.9433,
          "tokens": 1177441,
          "time": 179.8
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.301,
          "tokens": 590013,
          "time": 106.0
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 3.2006,
          "tokens": 1275341,
          "time": 159.2
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 1.7056,
          "tokens": 643534,
          "time": 69.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 1.4998,
          "tokens": 558837,
          "time": 58.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 1.329,
          "tokens": 546369,
          "time": 60.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 2.6588,
          "tokens": 998743,
          "time": 102.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 2.295,
          "tokens": 885896,
          "time": 122.2
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 1.6269,
          "tokens": 806442,
          "time": 946.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 2.1615,
          "tokens": 834193,
          "time": 125.3
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 3.0208,
          "tokens": 1130893,
          "time": 120.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 2.653,
          "tokens": 920415,
          "time": 111.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 3.5158,
          "tokens": 800296,
          "time": 96.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": true,
          "cost": 2.3903,
          "tokens": 954778,
          "time": 121.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 2.5448,
          "tokens": 1023077,
          "time": 125.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 1.6898,
          "tokens": 654390,
          "time": 65.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 1.0305,
          "tokens": 386599,
          "time": 42.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 1.9264,
          "tokens": 768694,
          "time": 70.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 1.4753,
          "tokens": 664334,
          "time": 68.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 2.6051,
          "tokens": 1098012,
          "time": 114.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 3.0647,
          "tokens": 1189426,
          "time": 130.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 2.8573,
          "tokens": 1034060,
          "time": 106.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 2.4992,
          "tokens": 1007921,
          "time": 95.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": true,
          "cost": 2.8333,
          "tokens": 1086287,
          "time": 127.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 2.6679,
          "tokens": 968825,
          "time": 132.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 2.7759,
          "tokens": 1085517,
          "time": 138.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 3.3671,
          "tokens": 1243746,
          "time": 123.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": true,
          "cost": 2.0454,
          "tokens": 837658,
          "time": 99.8
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 1.0577,
          "tokens": 467622,
          "time": 40.4
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.4121,
          "tokens": 329743,
          "time": 81.1
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 1.2744,
          "tokens": 482081,
          "time": 65.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 3.0543,
          "tokens": 1221804,
          "time": 121.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 2.3878,
          "tokens": 1119877,
          "time": 96.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 4.1808,
          "tokens": 1550379,
          "time": 178.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 3.3411,
          "tokens": 1267862,
          "time": 138.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 2.0056,
          "tokens": 769791,
          "time": 113.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 2.0794,
          "tokens": 827574,
          "time": 91.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 3.2606,
          "tokens": 1313510,
          "time": 124.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 3.8918,
          "tokens": 1715871,
          "time": 167.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": true,
          "cost": 2.7131,
          "tokens": 1088096,
          "time": 127.0
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 2.4288,
          "tokens": 1007439,
          "time": 168.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 3.047,
          "tokens": 1294031,
          "time": 126.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 3.7638,
          "tokens": 1589199,
          "time": 156.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 3.2175,
          "tokens": 1387394,
          "time": 163.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 2.1565,
          "tokens": 884534,
          "time": 106.0
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 3.7644,
          "tokens": 1452028,
          "time": 157.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 2.0749,
          "tokens": 918961,
          "time": 90.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 2.3703,
          "tokens": 1030375,
          "time": 124.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 2.8767,
          "tokens": 1229379,
          "time": 148.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": false,
          "cost": 1.6669,
          "tokens": 717526,
          "time": 94.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 1.6991,
          "tokens": 650837,
          "time": 61.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 2.4173,
          "tokens": 1128701,
          "time": 107.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 4.5115,
          "tokens": 1654638,
          "time": 140.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 3.277,
          "tokens": 1457964,
          "time": 204.7
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 2.4312,
          "tokens": 1033647,
          "time": 128.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 1.8156,
          "tokens": 771581,
          "time": 89.5
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 2.2454,
          "tokens": 923386,
          "time": 107.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 2.4463,
          "tokens": 925982,
          "time": 123.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 3.1219,
          "tokens": 1142178,
          "time": 107.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 1.7254,
          "tokens": 604591,
          "time": 76.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": false,
          "cost": 2.7683,
          "tokens": 1048043,
          "time": 122.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": true,
          "cost": 1.9164,
          "tokens": 720468,
          "time": 85.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 4.8094,
          "tokens": 2109199,
          "time": 214.7
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 1.9378,
          "tokens": 895445,
          "time": 114.0
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 1.2973,
          "tokens": 549005,
          "time": 71.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 2.6476,
          "tokens": 1021794,
          "time": 115.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 2.8914,
          "tokens": 1172069,
          "time": 104.8
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 3.0151,
          "tokens": 1209947,
          "time": 156.4
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 1.6388,
          "tokens": 661229,
          "time": 55.7
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 2.4696,
          "tokens": 1074853,
          "time": 120.7
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 2.1979,
          "tokens": 865745,
          "time": 179.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 2.7766,
          "tokens": 1074999,
          "time": 100.7
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": true,
          "cost": 2.6813,
          "tokens": 1013363,
          "time": 120.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 2.7389,
          "tokens": 992211,
          "time": 84.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 1.9543,
          "tokens": 745800,
          "time": 76.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 2.2133,
          "tokens": 892215,
          "time": 117.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 1.7606,
          "tokens": 733530,
          "time": 72.6
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 2.1784,
          "tokens": 839114,
          "time": 91.3
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 2.8963,
          "tokens": 1145208,
          "time": 136.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 2.1131,
          "tokens": 906319,
          "time": 117.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 2.7485,
          "tokens": 1252689,
          "time": 130.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 5.0773,
          "tokens": 2058594,
          "time": 193.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 1.5141,
          "tokens": 696429,
          "time": 84.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 1.0773,
          "tokens": 479930,
          "time": 61.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": true,
          "cost": 2.103,
          "tokens": 916253,
          "time": 116.2
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 3.0806,
          "tokens": 1548564,
          "time": 593.1
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 2.5133,
          "tokens": 1034092,
          "time": 110.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 2.8868,
          "tokens": 1179226,
          "time": 131.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 3.0606,
          "tokens": 1339614,
          "time": 151.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 2.2178,
          "tokens": 1009898,
          "time": 113.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 3.1782,
          "tokens": 1269281,
          "time": 202.1
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 2.7114,
          "tokens": 1093086,
          "time": 119.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 2.4964,
          "tokens": 975270,
          "time": 121.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 2.5078,
          "tokens": 1051728,
          "time": 107.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 3.6875,
          "tokens": 1621443,
          "time": 169.8
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 2.1984,
          "tokens": 919777,
          "time": 90.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 3.4875,
          "tokens": 1196734,
          "time": 104.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": true,
          "cost": 2.1975,
          "tokens": 737015,
          "time": 95.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": true,
          "cost": 3.0385,
          "tokens": 1215938,
          "time": 124.8
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 1.4821,
          "tokens": 642041,
          "time": 62.4
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 2.5331,
          "tokens": 1093628,
          "time": 137.4
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 1.2824,
          "tokens": 544201,
          "time": 71.7
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": false,
          "cost": 1.8603,
          "tokens": 710677,
          "time": 103.0
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 2.1679,
          "tokens": 936557,
          "time": 90.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 2.7399,
          "tokens": 1214878,
          "time": 148.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 2.1405,
          "tokens": 899888,
          "time": 82.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 1.8967,
          "tokens": 817679,
          "time": 88.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 1.172,
          "tokens": 516869,
          "time": 49.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.809,
          "tokens": 465397,
          "time": 209.5
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 3.1236,
          "tokens": 1397792,
          "time": 214.8
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 1.8367,
          "tokens": 669263,
          "time": 86.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.8347,
          "tokens": 364982,
          "time": 43.3
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 2.7238,
          "tokens": 1147078,
          "time": 129.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 1.6888,
          "tokens": 740829,
          "time": 85.5
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 3.5376,
          "tokens": 1230029,
          "time": 136.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 2.0663,
          "tokens": 820671,
          "time": 113.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 1.976,
          "tokens": 761435,
          "time": 88.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 1.5838,
          "tokens": 632932,
          "time": 80.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 2.2316,
          "tokens": 903552,
          "time": 100.3
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 2.4692,
          "tokens": 1061600,
          "time": 143.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 1.8899,
          "tokens": 705196,
          "time": 84.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 1.3614,
          "tokens": 563665,
          "time": 59.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 1.7978,
          "tokens": 698315,
          "time": 84.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 1.6067,
          "tokens": 679860,
          "time": 77.2
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 4.367,
          "tokens": 1840031,
          "time": 199.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 3.8446,
          "tokens": 1709448,
          "time": 177.5
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 2.0767,
          "tokens": 882474,
          "time": 96.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 2.4341,
          "tokens": 1058090,
          "time": 107.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 2.0424,
          "tokens": 913945,
          "time": 93.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 2.5608,
          "tokens": 978485,
          "time": 104.6
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.9121,
          "tokens": 792583,
          "time": 115.1
        }
      ]
    },
    {
      "runKey": "rag-gpt-5.5",
      "harness": "trace-rag",
      "model": "gpt-5.5",
      "modelName": "gpt-5.5",
      "reported": {
        "cost": 0.672,
        "tokens": 215000,
        "time": 202,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 1.4942,
          "tokens": 290418,
          "time": 182.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.2888,
          "tokens": 55128,
          "time": 90.2
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 1.6197,
          "tokens": 314174,
          "time": 267.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.932,
          "tokens": 175419,
          "time": 177.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 1.7593,
          "tokens": 340830,
          "time": 108.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 1.5456,
          "tokens": 299156,
          "time": 131.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.3686,
          "tokens": 265570,
          "time": 164.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.7324,
          "tokens": 336352,
          "time": 167.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 1.4361,
          "tokens": 276517,
          "time": 248.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 2.404,
          "tokens": 471602,
          "time": 131.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.8635,
          "tokens": 165120,
          "time": 122.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 1.0026,
          "tokens": 193075,
          "time": 95.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.0338,
          "tokens": 199775,
          "time": 86.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.9827,
          "tokens": 187017,
          "time": 102.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 1.0219,
          "tokens": 193905,
          "time": 113.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 1.5685,
          "tokens": 303337,
          "time": 183.9
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.7361,
          "tokens": 140652,
          "time": 373.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.5453,
          "tokens": 102580,
          "time": 380.0
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 1.4439,
          "tokens": 280710,
          "time": 380.6
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 1.8812,
          "tokens": 365972,
          "time": 433.5
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 1.2469,
          "tokens": 242027,
          "time": 445.6
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.9442,
          "tokens": 176545,
          "time": 428.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.5452,
          "tokens": 101790,
          "time": 257.9
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.4983,
          "tokens": 95291,
          "time": 274.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 1.3103,
          "tokens": 254953,
          "time": 360.3
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.4006,
          "tokens": 266290,
          "time": 440.6
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.4514,
          "tokens": 78760,
          "time": 408.4
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 1.5761,
          "tokens": 304468,
          "time": 420.2
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.8367,
          "tokens": 148983,
          "time": 420.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.6489,
          "tokens": 123846,
          "time": 348.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.909,
          "tokens": 171214,
          "time": 379.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 2.165,
          "tokens": 422706,
          "time": 372.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 3.5159,
          "tokens": 680500,
          "time": 452.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": true,
          "cost": 2.1648,
          "tokens": 420866,
          "time": 357.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.5449,
          "tokens": 102798,
          "time": 357.7
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.6976,
          "tokens": 133727,
          "time": 358.4
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.3138,
          "tokens": 250034,
          "time": 388.3
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.7876,
          "tokens": 130582,
          "time": 436.9
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.97,
          "tokens": 166232,
          "time": 277.6
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 1.835,
          "tokens": 344789,
          "time": 399.2
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.4808,
          "tokens": 87169,
          "time": 370.7
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.6209,
          "tokens": 115484,
          "time": 261.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.9233,
          "tokens": 170413,
          "time": 370.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.9302,
          "tokens": 174193,
          "time": 259.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.7716,
          "tokens": 147315,
          "time": 362.5
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.6658,
          "tokens": 126353,
          "time": 97.3
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.7358,
          "tokens": 141453,
          "time": 90.1
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.5415,
          "tokens": 102575,
          "time": 91.6
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 3.4524,
          "tokens": 681622,
          "time": 111.1
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.7721,
          "tokens": 147958,
          "time": 125.9
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.7651,
          "tokens": 143103,
          "time": 119.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 2.2012,
          "tokens": 428609,
          "time": 261.7
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.8066,
          "tokens": 155705,
          "time": 85.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 8.61,
          "tokens": 1698035,
          "time": 359.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.9831,
          "tokens": 189443,
          "time": 262.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 1.2605,
          "tokens": 242853,
          "time": 114.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.3159,
          "tokens": 59842,
          "time": 75.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.6267,
          "tokens": 117232,
          "time": 98.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 3.0163,
          "tokens": 590522,
          "time": 252.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": false,
          "cost": 0.7237,
          "tokens": 137744,
          "time": 160.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.5426,
          "tokens": 99857,
          "time": 99.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.9644,
          "tokens": 187099,
          "time": 375.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.5785,
          "tokens": 108850,
          "time": 432.9
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 1.9337,
          "tokens": 371147,
          "time": 470.4
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.5157,
          "tokens": 95175,
          "time": 445.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.3267,
          "tokens": 60944,
          "time": 432.9
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.66,
          "tokens": 124296,
          "time": 408.2
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.5869,
          "tokens": 309460,
          "time": 376.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 2.8586,
          "tokens": 564723,
          "time": 361.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.3928,
          "tokens": 74916,
          "time": 372.3
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 1.1839,
          "tokens": 232899,
          "time": 447.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 2.2247,
          "tokens": 433406,
          "time": 428.9
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.5464,
          "tokens": 103593,
          "time": 264.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.8493,
          "tokens": 160612,
          "time": 275.9
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 0.5988,
          "tokens": 111288,
          "time": 275.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 1.159,
          "tokens": 220775,
          "time": 437.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.7005,
          "tokens": 133667,
          "time": 399.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.0786,
          "tokens": 208401,
          "time": 343.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.6678,
          "tokens": 125035,
          "time": 372.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.7339,
          "tokens": 139436,
          "time": 357.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.4274,
          "tokens": 79297,
          "time": 334.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 1.17,
          "tokens": 225736,
          "time": 371.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.9993,
          "tokens": 191712,
          "time": 365.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.352,
          "tokens": 64092,
          "time": 77.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 1.2259,
          "tokens": 235454,
          "time": 189.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 1.3014,
          "tokens": 250549,
          "time": 131.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.9079,
          "tokens": 370000,
          "time": 333.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 1.4624,
          "tokens": 280846,
          "time": 135.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 1.2303,
          "tokens": 232908,
          "time": 164.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.7567,
          "tokens": 140902,
          "time": 160.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.8319,
          "tokens": 154826,
          "time": 330.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.7078,
          "tokens": 130150,
          "time": 337.6
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.7213,
          "tokens": 139824,
          "time": 295.5
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.4794,
          "tokens": 90451,
          "time": 278.6
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.5188,
          "tokens": 98567,
          "time": 306.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 0.4633,
          "tokens": 85732,
          "time": 304.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.6873,
          "tokens": 131998,
          "time": 282.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.4767,
          "tokens": 88779,
          "time": 305.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.8688,
          "tokens": 164168,
          "time": 325.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.6725,
          "tokens": 124495,
          "time": 301.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 1.9856,
          "tokens": 392253,
          "time": 353.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 1.1033,
          "tokens": 208052,
          "time": 379.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 1.3982,
          "tokens": 274564,
          "time": 311.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.2215,
          "tokens": 239235,
          "time": 280.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.7602,
          "tokens": 145216,
          "time": 261.0
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 2.1306,
          "tokens": 412888,
          "time": 310.9
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 2.6296,
          "tokens": 518995,
          "time": 276.5
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.7046,
          "tokens": 334347,
          "time": 275.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.7244,
          "tokens": 138413,
          "time": 226.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.503,
          "tokens": 95716,
          "time": 208.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.937,
          "tokens": 180290,
          "time": 188.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": true,
          "cost": 0.8936,
          "tokens": 170843,
          "time": 199.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.8459,
          "tokens": 160079,
          "time": 192.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.8832,
          "tokens": 169150,
          "time": 192.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.9527,
          "tokens": 182087,
          "time": 196.3
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.5144,
          "tokens": 95528,
          "time": 204.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.8164,
          "tokens": 155809,
          "time": 202.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 2.5143,
          "tokens": 495798,
          "time": 199.5
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.4907,
          "tokens": 92416,
          "time": 170.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.6597,
          "tokens": 123852,
          "time": 130.9
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.5559,
          "tokens": 105597,
          "time": 109.0
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.6609,
          "tokens": 124111,
          "time": 127.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 1.0271,
          "tokens": 195804,
          "time": 114.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.8906,
          "tokens": 172000,
          "time": 110.7
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.7614,
          "tokens": 147998,
          "time": 98.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.9457,
          "tokens": 179598,
          "time": 117.5
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 1.199,
          "tokens": 234180,
          "time": 101.1
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.3546,
          "tokens": 67586,
          "time": 91.0
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.6431,
          "tokens": 122920,
          "time": 114.0
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.8658,
          "tokens": 167616,
          "time": 113.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.8285,
          "tokens": 158031,
          "time": 124.2
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.7904,
          "tokens": 152285,
          "time": 112.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 1.1248,
          "tokens": 216108,
          "time": 116.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 1.3029,
          "tokens": 251203,
          "time": 117.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.3022,
          "tokens": 52558,
          "time": 107.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 1.0281,
          "tokens": 196440,
          "time": 116.1
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.8518,
          "tokens": 160480,
          "time": 117.9
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.3145,
          "tokens": 58123,
          "time": 91.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.5466,
          "tokens": 104269,
          "time": 85.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.5826,
          "tokens": 108695,
          "time": 92.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.3482,
          "tokens": 64293,
          "time": 75.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.7412,
          "tokens": 138822,
          "time": 94.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.8552,
          "tokens": 161804,
          "time": 94.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.3678,
          "tokens": 67733,
          "time": 75.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.4279,
          "tokens": 80643,
          "time": 68.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 2.4772,
          "tokens": 485727,
          "time": 111.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 2.1789,
          "tokens": 422992,
          "time": 113.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 3.1272,
          "tokens": 613383,
          "time": 116.3
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 3.1506,
          "tokens": 612095,
          "time": 145.3
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 1.0082,
          "tokens": 184379,
          "time": 124.8
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 1.999,
          "tokens": 390540,
          "time": 107.1
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 2.5378,
          "tokens": 491690,
          "time": 124.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 2.7124,
          "tokens": 530419,
          "time": 109.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.2572,
          "tokens": 241986,
          "time": 103.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.0493,
          "tokens": 201693,
          "time": 93.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 3.1263,
          "tokens": 616445,
          "time": 100.5
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.143,
          "tokens": 218645,
          "time": 106.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.5187,
          "tokens": 98409,
          "time": 82.9
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 2.0813,
          "tokens": 406944,
          "time": 95.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.1574,
          "tokens": 223265,
          "time": 92.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 3.0645,
          "tokens": 602940,
          "time": 104.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 1.5027,
          "tokens": 288828,
          "time": 109.2
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.7866,
          "tokens": 145483,
          "time": 96.9
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.5487,
          "tokens": 103979,
          "time": 62.0
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 1.1819,
          "tokens": 227076,
          "time": 98.0
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.7934,
          "tokens": 151764,
          "time": 67.4
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.5544,
          "tokens": 105453,
          "time": 65.6
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.4467,
          "tokens": 84640,
          "time": 64.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 2.6169,
          "tokens": 510874,
          "time": 105.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.7699,
          "tokens": 148436,
          "time": 57.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.8944,
          "tokens": 172102,
          "time": 67.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.3629,
          "tokens": 67696,
          "time": 50.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 1.5944,
          "tokens": 306132,
          "time": 96.0
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.6654,
          "tokens": 126264,
          "time": 64.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 1.2577,
          "tokens": 244484,
          "time": 68.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 1.09,
          "tokens": 209434,
          "time": 66.2
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.3089,
          "tokens": 57146,
          "time": 46.6
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.8407,
          "tokens": 159156,
          "time": 68.2
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.9771,
          "tokens": 184265,
          "time": 75.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.8733,
          "tokens": 164233,
          "time": 68.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.3098,
          "tokens": 54265,
          "time": 51.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.7026,
          "tokens": 131537,
          "time": 67.4
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.4492,
          "tokens": 82655,
          "time": 53.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.1965,
          "tokens": 35762,
          "time": 36.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.4507,
          "tokens": 82395,
          "time": 58.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.2001,
          "tokens": 36461,
          "time": 39.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.2847,
          "tokens": 51684,
          "time": 43.4
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.5536,
          "tokens": 103042,
          "time": 59.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 0.9711,
          "tokens": 187604,
          "time": 53.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 1.2348,
          "tokens": 237889,
          "time": 66.1
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.5362,
          "tokens": 100897,
          "time": 40.0
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.4589,
          "tokens": 84117,
          "time": 52.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.9282,
          "tokens": 179749,
          "time": 59.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.8512,
          "tokens": 163301,
          "time": 57.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.5825,
          "tokens": 110662,
          "time": 44.9
        }
      ]
    },
    {
      "runKey": "rlm-haiku-4.5",
      "harness": "trace-rlm",
      "model": "claude-haiku-4.5",
      "modelName": "claude-haiku-4.5",
      "reported": {
        "cost": 0.157,
        "tokens": 516000,
        "time": 191,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.0879,
          "tokens": 263918,
          "time": 164.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.2187,
          "tokens": 1013001,
          "time": 257.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.4856,
          "tokens": 3056694,
          "time": 491.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.046,
          "tokens": 72113,
          "time": 96.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 0.1348,
          "tokens": 499162,
          "time": 210.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.1055,
          "tokens": 163559,
          "time": 85.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.0872,
          "tokens": 195989,
          "time": 131.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.0574,
          "tokens": 145768,
          "time": 93.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.0754,
          "tokens": 153710,
          "time": 86.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.082,
          "tokens": 208322,
          "time": 170.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.0883,
          "tokens": 220974,
          "time": 178.6
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.2276,
          "tokens": 477483,
          "time": 215.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.1815,
          "tokens": 538143,
          "time": 207.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.0439,
          "tokens": 65923,
          "time": 71.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.2723,
          "tokens": 551573,
          "time": 238.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.367,
          "tokens": 432259,
          "time": 175.2
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.1599,
          "tokens": 347917,
          "time": 224.8
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.1395,
          "tokens": 557767,
          "time": 208.0
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.4301,
          "tokens": 2092336,
          "time": 388.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": true,
          "cost": 0.246,
          "tokens": 1171018,
          "time": 247.6
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.0834,
          "tokens": 271097,
          "time": 192.4
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 0.085,
          "tokens": 223983,
          "time": 172.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.044,
          "tokens": 65016,
          "time": 77.0
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.1138,
          "tokens": 350757,
          "time": 171.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.1264,
          "tokens": 425136,
          "time": 138.1
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.1501,
          "tokens": 616961,
          "time": 212.9
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.1556,
          "tokens": 611628,
          "time": 278.8
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": true,
          "cost": 0.1449,
          "tokens": 280173,
          "time": 168.4
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.2021,
          "tokens": 822533,
          "time": 264.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.0595,
          "tokens": 125466,
          "time": 137.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.1116,
          "tokens": 259929,
          "time": 132.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.0982,
          "tokens": 273921,
          "time": 166.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 0.1648,
          "tokens": 731863,
          "time": 243.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.2006,
          "tokens": 937496,
          "time": 240.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.2243,
          "tokens": 1066758,
          "time": 255.3
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.1317,
          "tokens": 549312,
          "time": 181.8
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.0625,
          "tokens": 148667,
          "time": 112.2
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.2317,
          "tokens": 737609,
          "time": 266.9
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": true,
          "cost": 0.4385,
          "tokens": 1317508,
          "time": 358.7
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": true,
          "cost": 0.2619,
          "tokens": 1116815,
          "time": 265.6
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.1075,
          "tokens": 325077,
          "time": 224.1
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.0938,
          "tokens": 240910,
          "time": 185.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.089,
          "tokens": 249697,
          "time": 229.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.1851,
          "tokens": 879794,
          "time": 184.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.1556,
          "tokens": 577316,
          "time": 208.1
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.1399,
          "tokens": 520553,
          "time": 194.2
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.031,
          "tokens": 45228,
          "time": 73.6
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.1241,
          "tokens": 430756,
          "time": 221.8
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.0531,
          "tokens": 110368,
          "time": 73.5
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.182,
          "tokens": 844317,
          "time": 211.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.1733,
          "tokens": 416703,
          "time": 216.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.2247,
          "tokens": 988613,
          "time": 322.5
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.2472,
          "tokens": 1182651,
          "time": 364.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.1232,
          "tokens": 380829,
          "time": 190.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.0864,
          "tokens": 277534,
          "time": 107.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.0697,
          "tokens": 161341,
          "time": 157.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.0611,
          "tokens": 155109,
          "time": 87.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.1263,
          "tokens": 457264,
          "time": 249.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.099,
          "tokens": 282807,
          "time": 192.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.0997,
          "tokens": 318352,
          "time": 178.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.0957,
          "tokens": 337350,
          "time": 150.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.1175,
          "tokens": 402508,
          "time": 183.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.2244,
          "tokens": 1204756,
          "time": 282.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.1116,
          "tokens": 355305,
          "time": 165.2
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": true,
          "cost": 0.1628,
          "tokens": 680150,
          "time": 239.0
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.0777,
          "tokens": 219572,
          "time": 104.6
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.2373,
          "tokens": 374693,
          "time": 119.3
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.0428,
          "tokens": 90115,
          "time": 96.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 0.2312,
          "tokens": 1218782,
          "time": 374.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.0643,
          "tokens": 190357,
          "time": 136.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.1003,
          "tokens": 325693,
          "time": 157.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.17,
          "tokens": 742680,
          "time": 253.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.0757,
          "tokens": 162734,
          "time": 110.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.1288,
          "tokens": 494874,
          "time": 242.9
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.0631,
          "tokens": 175935,
          "time": 108.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.1715,
          "tokens": 595162,
          "time": 207.7
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.1064,
          "tokens": 311578,
          "time": 211.7
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.1278,
          "tokens": 195052,
          "time": 118.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.0868,
          "tokens": 220385,
          "time": 105.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.0456,
          "tokens": 96801,
          "time": 238.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.0345,
          "tokens": 40849,
          "time": 40.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.0667,
          "tokens": 178660,
          "time": 177.2
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.1052,
          "tokens": 361082,
          "time": 158.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.0919,
          "tokens": 256420,
          "time": 176.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.0367,
          "tokens": 62471,
          "time": 60.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.2174,
          "tokens": 346542,
          "time": 143.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.1455,
          "tokens": 476699,
          "time": 204.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.074,
          "tokens": 199423,
          "time": 160.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.2176,
          "tokens": 570933,
          "time": 205.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.1597,
          "tokens": 608276,
          "time": 221.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.3519,
          "tokens": 1056090,
          "time": 313.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.0415,
          "tokens": 98058,
          "time": 57.7
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.0569,
          "tokens": 148258,
          "time": 73.6
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.0622,
          "tokens": 119830,
          "time": 96.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.0714,
          "tokens": 155839,
          "time": 121.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 0.3786,
          "tokens": 1288500,
          "time": 276.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.3238,
          "tokens": 1284632,
          "time": 282.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.0832,
          "tokens": 257194,
          "time": 129.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.1072,
          "tokens": 252898,
          "time": 174.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.0914,
          "tokens": 294767,
          "time": 115.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": null,
          "tokens": null,
          "time": 3600.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.1748,
          "tokens": 806669,
          "time": 203.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.1124,
          "tokens": 316393,
          "time": 204.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.2307,
          "tokens": 1000189,
          "time": 271.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": true,
          "cost": 0.0746,
          "tokens": 216530,
          "time": 188.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": true,
          "cost": 0.0848,
          "tokens": 251994,
          "time": 156.0
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 0.3315,
          "tokens": 1746639,
          "time": 368.2
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.3179,
          "tokens": 1643332,
          "time": 384.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.2389,
          "tokens": 1202608,
          "time": 219.0
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.2164,
          "tokens": 731572,
          "time": 980.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.1175,
          "tokens": 399587,
          "time": 165.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.0666,
          "tokens": 133449,
          "time": 142.4
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.1073,
          "tokens": 400651,
          "time": 157.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.1246,
          "tokens": 496773,
          "time": 230.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.0871,
          "tokens": 194196,
          "time": 130.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.0534,
          "tokens": 135356,
          "time": 85.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.1556,
          "tokens": 578112,
          "time": 155.1
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.5574,
          "tokens": 3234837,
          "time": 541.6
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.2754,
          "tokens": 1385439,
          "time": 256.0
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.3278,
          "tokens": 485133,
          "time": 169.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.1993,
          "tokens": 495861,
          "time": 248.9
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 0.0763,
          "tokens": 229951,
          "time": 144.9
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.1177,
          "tokens": 417923,
          "time": 205.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.2163,
          "tokens": 344345,
          "time": 157.9
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.0683,
          "tokens": 171725,
          "time": 75.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.1025,
          "tokens": 367525,
          "time": 155.7
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.2118,
          "tokens": 358085,
          "time": 196.6
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 0.1127,
          "tokens": 440404,
          "time": 156.4
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0913,
          "tokens": 258057,
          "time": 145.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.0953,
          "tokens": 317819,
          "time": 119.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.088,
          "tokens": 278112,
          "time": 166.6
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.1462,
          "tokens": 421758,
          "time": 187.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.0855,
          "tokens": 265998,
          "time": 149.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.1469,
          "tokens": 627179,
          "time": 157.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.1089,
          "tokens": 326267,
          "time": 175.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.0573,
          "tokens": 140430,
          "time": 109.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.1062,
          "tokens": 333726,
          "time": 215.1
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.1145,
          "tokens": 424477,
          "time": 212.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.3122,
          "tokens": 643666,
          "time": 172.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 0.0621,
          "tokens": 182629,
          "time": 59.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.0743,
          "tokens": 126091,
          "time": 96.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": false,
          "cost": 0.0693,
          "tokens": 174540,
          "time": 93.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.1358,
          "tokens": 453756,
          "time": 113.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 0.1779,
          "tokens": 300407,
          "time": 147.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.097,
          "tokens": 313432,
          "time": 157.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.1651,
          "tokens": 640889,
          "time": 208.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.4007,
          "tokens": 1994800,
          "time": 426.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.1133,
          "tokens": 426069,
          "time": 157.3
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.294,
          "tokens": 1428879,
          "time": 441.6
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.1675,
          "tokens": 574301,
          "time": 209.9
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 0.0681,
          "tokens": 129785,
          "time": 121.3
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.1374,
          "tokens": 416632,
          "time": 216.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.4527,
          "tokens": 1737435,
          "time": 369.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.2663,
          "tokens": 1434353,
          "time": 262.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.152,
          "tokens": 619857,
          "time": 177.0
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.1705,
          "tokens": 759536,
          "time": 1063.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.1236,
          "tokens": 455777,
          "time": 144.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.1575,
          "tokens": 642161,
          "time": 158.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.0921,
          "tokens": 232942,
          "time": 112.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.0643,
          "tokens": 196186,
          "time": 103.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.1252,
          "tokens": 406373,
          "time": 198.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.3768,
          "tokens": 2209224,
          "time": 318.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.7273,
          "tokens": 1821572,
          "time": 522.3
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.0507,
          "tokens": 122205,
          "time": 59.1
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.0564,
          "tokens": 148176,
          "time": 98.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.0405,
          "tokens": 59678,
          "time": 48.5
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.0491,
          "tokens": 115460,
          "time": 92.0
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.0584,
          "tokens": 139632,
          "time": 102.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.1378,
          "tokens": 401780,
          "time": 255.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.0544,
          "tokens": 98236,
          "time": 84.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.0524,
          "tokens": 136126,
          "time": 68.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.046,
          "tokens": 111043,
          "time": 75.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.1679,
          "tokens": 702276,
          "time": 286.8
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.1971,
          "tokens": 483449,
          "time": 190.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 0.0986,
          "tokens": 282077,
          "time": 140.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.0609,
          "tokens": 157260,
          "time": 92.0
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.0862,
          "tokens": 213498,
          "time": 77.1
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.0609,
          "tokens": 122851,
          "time": 61.2
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.1244,
          "tokens": 1413932,
          "time": 194.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.1764,
          "tokens": 767115,
          "time": 310.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.0777,
          "tokens": 233906,
          "time": 101.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.0984,
          "tokens": 274133,
          "time": 152.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.0821,
          "tokens": 260837,
          "time": 141.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.048,
          "tokens": 109372,
          "time": 99.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 0.365,
          "tokens": 1110026,
          "time": 323.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.0715,
          "tokens": 95029,
          "time": 66.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.1009,
          "tokens": 320302,
          "time": 234.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.0635,
          "tokens": 124473,
          "time": 140.2
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.1665,
          "tokens": 369930,
          "time": 165.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 1.2742,
          "tokens": 1639078,
          "time": 384.5
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.0378,
          "tokens": 64426,
          "time": 83.0
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": true,
          "cost": 0.2492,
          "tokens": 1157609,
          "time": 395.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.0844,
          "tokens": 215308,
          "time": 112.6
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.0738,
          "tokens": 146146,
          "time": 114.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.0529,
          "tokens": 74451,
          "time": 105.9
        }
      ]
    },
    {
      "runKey": "rag-opus-4.8",
      "harness": "trace-rag",
      "model": "claude-opus-4.8",
      "modelName": "claude-opus-4.8",
      "reported": {
        "cost": 1.016,
        "tokens": 191000,
        "time": 184,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": true,
          "cost": 1.6201,
          "tokens": 312860,
          "time": 169.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": true,
          "cost": 0.7958,
          "tokens": 151874,
          "time": 146.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 0.745,
          "tokens": 137528,
          "time": 135.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": true,
          "cost": 1.5599,
          "tokens": 296967,
          "time": 215.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.9236,
          "tokens": 169779,
          "time": 136.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.9586,
          "tokens": 177205,
          "time": 169.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 2.2001,
          "tokens": 421383,
          "time": 223.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.614,
          "tokens": 114546,
          "time": 135.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 1.9013,
          "tokens": 363375,
          "time": 232.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.9374,
          "tokens": 180563,
          "time": 117.0
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.7395,
          "tokens": 139513,
          "time": 148.6
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.9124,
          "tokens": 371302,
          "time": 108.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.5345,
          "tokens": 292840,
          "time": 154.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.8971,
          "tokens": 169050,
          "time": 135.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.6859,
          "tokens": 127309,
          "time": 147.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 1.564,
          "tokens": 298510,
          "time": 169.1
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": true,
          "cost": 0.6895,
          "tokens": 128593,
          "time": 339.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.7377,
          "tokens": 135286,
          "time": 322.5
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.7177,
          "tokens": 135856,
          "time": 222.9
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.9406,
          "tokens": 178429,
          "time": 366.8
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.6546,
          "tokens": 122314,
          "time": 200.8
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 0.7524,
          "tokens": 139767,
          "time": 380.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.9177,
          "tokens": 171482,
          "time": 215.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.6032,
          "tokens": 113496,
          "time": 309.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.917,
          "tokens": 170976,
          "time": 356.8
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.6383,
          "tokens": 115342,
          "time": 340.6
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.3128,
          "tokens": 56317,
          "time": 350.1
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.3256,
          "tokens": 58317,
          "time": 308.4
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.9284,
          "tokens": 167259,
          "time": 310.9
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.4176,
          "tokens": 76256,
          "time": 271.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.6133,
          "tokens": 111137,
          "time": 275.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 1.5937,
          "tokens": 305606,
          "time": 287.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 1.8249,
          "tokens": 345088,
          "time": 275.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.7434,
          "tokens": 137754,
          "time": 199.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.5283,
          "tokens": 94249,
          "time": 354.5
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.196,
          "tokens": 33643,
          "time": 200.9
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.5044,
          "tokens": 88566,
          "time": 285.5
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.6512,
          "tokens": 114138,
          "time": 220.4
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.5762,
          "tokens": 97432,
          "time": 168.3
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 1.182,
          "tokens": 214668,
          "time": 254.3
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.8084,
          "tokens": 149249,
          "time": 352.8
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 1.1916,
          "tokens": 221876,
          "time": 323.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.7308,
          "tokens": 128642,
          "time": 309.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 1.4759,
          "tokens": 279024,
          "time": 356.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": true,
          "cost": 0.4666,
          "tokens": 84055,
          "time": 319.9
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.9648,
          "tokens": 180110,
          "time": 135.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.4628,
          "tokens": 84106,
          "time": 134.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.4938,
          "tokens": 88890,
          "time": 99.8
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 1.6644,
          "tokens": 323781,
          "time": 135.6
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.9849,
          "tokens": 182691,
          "time": 157.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.6331,
          "tokens": 114262,
          "time": 135.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 1.2684,
          "tokens": 243631,
          "time": 134.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 1.4477,
          "tokens": 276762,
          "time": 161.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 1.8105,
          "tokens": 347126,
          "time": 116.2
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 1.6064,
          "tokens": 307435,
          "time": 146.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 1.9966,
          "tokens": 382584,
          "time": 162.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.2692,
          "tokens": 46090,
          "time": 98.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.3051,
          "tokens": 53371,
          "time": 79.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.9139,
          "tokens": 172485,
          "time": 136.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.4934,
          "tokens": 90577,
          "time": 111.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.7994,
          "tokens": 147545,
          "time": 155.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.8367,
          "tokens": 158183,
          "time": 262.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.7219,
          "tokens": 128926,
          "time": 424.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.9139,
          "tokens": 166356,
          "time": 393.0
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.184,
          "tokens": 225624,
          "time": 287.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.5391,
          "tokens": 99287,
          "time": 367.0
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 1.3744,
          "tokens": 259998,
          "time": 422.9
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 1.4539,
          "tokens": 279593,
          "time": 381.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 1.7109,
          "tokens": 333096,
          "time": 373.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.3004,
          "tokens": 55088,
          "time": 322.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 2.3274,
          "tokens": 451478,
          "time": 379.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 2.1363,
          "tokens": 407018,
          "time": 393.2
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.5673,
          "tokens": 105870,
          "time": 322.7
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.4035,
          "tokens": 74670,
          "time": 201.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 0.3583,
          "tokens": 62275,
          "time": 409.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 1.0075,
          "tokens": 187864,
          "time": 221.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 1.157,
          "tokens": 220177,
          "time": 285.7
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.9609,
          "tokens": 377837,
          "time": 323.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.6543,
          "tokens": 117805,
          "time": 327.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.3533,
          "tokens": 63190,
          "time": 211.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.2499,
          "tokens": 44691,
          "time": 347.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 3.6526,
          "tokens": 714815,
          "time": 381.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.417,
          "tokens": 76739,
          "time": 340.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.6613,
          "tokens": 123474,
          "time": 135.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.7671,
          "tokens": 136405,
          "time": 169.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 0.6491,
          "tokens": 118256,
          "time": 155.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 1.2246,
          "tokens": 233302,
          "time": 136.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.6118,
          "tokens": 109347,
          "time": 161.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.9469,
          "tokens": 171174,
          "time": 169.3
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 1.0844,
          "tokens": 202520,
          "time": 145.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.8489,
          "tokens": 160621,
          "time": 245.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 1.0787,
          "tokens": 200014,
          "time": 225.0
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": false,
          "cost": 1.2576,
          "tokens": 238025,
          "time": 189.9
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 1.5503,
          "tokens": 295329,
          "time": 193.2
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 0.394,
          "tokens": 67159,
          "time": 260.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.5177,
          "tokens": 292207,
          "time": 190.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 0.8269,
          "tokens": 151688,
          "time": 205.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.7115,
          "tokens": 134890,
          "time": 177.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 1.2949,
          "tokens": 246834,
          "time": 205.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.7309,
          "tokens": 136656,
          "time": 174.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 5.1216,
          "tokens": 1010902,
          "time": 283.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.3922,
          "tokens": 263817,
          "time": 212.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.879,
          "tokens": 168080,
          "time": 225.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.5406,
          "tokens": 296529,
          "time": 204.1
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 1.2326,
          "tokens": 234905,
          "time": 223.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 1.6453,
          "tokens": 316359,
          "time": 211.8
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 2.4919,
          "tokens": 485536,
          "time": 258.0
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 1.3262,
          "tokens": 254938,
          "time": 215.2
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.3297,
          "tokens": 59210,
          "time": 160.9
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.4523,
          "tokens": 82017,
          "time": 207.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 1.3952,
          "tokens": 267181,
          "time": 195.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.9426,
          "tokens": 176470,
          "time": 179.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 0.737,
          "tokens": 134387,
          "time": 187.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": false,
          "cost": 0.6285,
          "tokens": 113278,
          "time": 160.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.3406,
          "tokens": 60500,
          "time": 127.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.6103,
          "tokens": 110807,
          "time": 132.6
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 1.0761,
          "tokens": 201453,
          "time": 160.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.6544,
          "tokens": 120206,
          "time": 150.8
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.4144,
          "tokens": 72306,
          "time": 145.0
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": false,
          "cost": 1.0099,
          "tokens": 191365,
          "time": 145.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 1.8816,
          "tokens": 356475,
          "time": 179.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.531,
          "tokens": 99089,
          "time": 120.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.8801,
          "tokens": 166540,
          "time": 142.7
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.3018,
          "tokens": 55166,
          "time": 103.8
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.3089,
          "tokens": 56060,
          "time": 100.5
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.6572,
          "tokens": 121863,
          "time": 122.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 1.2183,
          "tokens": 234045,
          "time": 126.0
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 2.2664,
          "tokens": 436763,
          "time": 177.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.4919,
          "tokens": 90761,
          "time": 146.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.6531,
          "tokens": 122245,
          "time": 134.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.6502,
          "tokens": 121639,
          "time": 126.0
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 2.0311,
          "tokens": 388247,
          "time": 176.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.4009,
          "tokens": 72165,
          "time": 137.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.7922,
          "tokens": 144401,
          "time": 148.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": true,
          "cost": 0.6719,
          "tokens": 124379,
          "time": 121.4
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 1.1902,
          "tokens": 223886,
          "time": 151.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": true,
          "cost": 0.5525,
          "tokens": 101142,
          "time": 111.5
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.6324,
          "tokens": 118825,
          "time": 108.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.2902,
          "tokens": 49148,
          "time": 99.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 1.8229,
          "tokens": 348627,
          "time": 158.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.6698,
          "tokens": 123930,
          "time": 117.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.9109,
          "tokens": 170153,
          "time": 117.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.6713,
          "tokens": 124243,
          "time": 117.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.623,
          "tokens": 115741,
          "time": 109.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.7214,
          "tokens": 131271,
          "time": 122.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 1.2467,
          "tokens": 235393,
          "time": 152.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 1.9182,
          "tokens": 364845,
          "time": 183.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 1.3616,
          "tokens": 256428,
          "time": 158.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 1.9397,
          "tokens": 367506,
          "time": 167.6
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 1.0036,
          "tokens": 183494,
          "time": 139.4
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 1.1457,
          "tokens": 220201,
          "time": 120.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.7693,
          "tokens": 142773,
          "time": 108.8
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 2.7705,
          "tokens": 541040,
          "time": 177.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.2755,
          "tokens": 240110,
          "time": 116.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 4.6603,
          "tokens": 912258,
          "time": 208.8
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.8134,
          "tokens": 152527,
          "time": 88.9
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.4468,
          "tokens": 273018,
          "time": 158.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 1.3129,
          "tokens": 246740,
          "time": 134.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 2.2012,
          "tokens": 427853,
          "time": 145.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.3599,
          "tokens": 63201,
          "time": 80.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 1.6747,
          "tokens": 322939,
          "time": 142.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.771,
          "tokens": 143465,
          "time": 114.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.5315,
          "tokens": 94005,
          "time": 108.8
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.4972,
          "tokens": 92664,
          "time": 73.5
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 1.0116,
          "tokens": 191122,
          "time": 108.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.6715,
          "tokens": 122837,
          "time": 75.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.5228,
          "tokens": 95489,
          "time": 80.2
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.3382,
          "tokens": 61898,
          "time": 67.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 1.237,
          "tokens": 236444,
          "time": 104.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.6208,
          "tokens": 116126,
          "time": 70.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.724,
          "tokens": 136226,
          "time": 85.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.4853,
          "tokens": 90112,
          "time": 59.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.8222,
          "tokens": 149038,
          "time": 104.8
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.609,
          "tokens": 107076,
          "time": 91.6
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 0.3747,
          "tokens": 67524,
          "time": 59.3
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.7073,
          "tokens": 128073,
          "time": 93.0
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 1.7905,
          "tokens": 340415,
          "time": 119.5
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 0.4919,
          "tokens": 90882,
          "time": 54.0
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.4016,
          "tokens": 261927,
          "time": 123.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.7323,
          "tokens": 128908,
          "time": 109.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.6558,
          "tokens": 119629,
          "time": 80.7
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.5647,
          "tokens": 102921,
          "time": 76.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 1.9287,
          "tokens": 370429,
          "time": 121.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 1.3254,
          "tokens": 250428,
          "time": 106.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 1.0509,
          "tokens": 198936,
          "time": 87.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.4236,
          "tokens": 76671,
          "time": 62.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.9183,
          "tokens": 167124,
          "time": 100.7
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.7928,
          "tokens": 144302,
          "time": 82.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.8964,
          "tokens": 169364,
          "time": 80.2
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.6777,
          "tokens": 124303,
          "time": 79.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.4378,
          "tokens": 79960,
          "time": 59.9
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.3187,
          "tokens": 56005,
          "time": 56.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.5696,
          "tokens": 105810,
          "time": 43.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 1.3735,
          "tokens": 260273,
          "time": 86.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.1357,
          "tokens": 211590,
          "time": 92.3
        }
      ]
    },
    {
      "runKey": "hermes-gpt-5.5",
      "harness": "hermes",
      "model": "gpt-5.5",
      "modelName": "gpt-5.5",
      "reported": {
        "cost": 1.527,
        "tokens": 100000,
        "time": 145,
        "tokensEstimated": true
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.5105,
          "tokens": null,
          "time": 93.3
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.9373,
          "tokens": null,
          "time": 117.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 2.7963,
          "tokens": null,
          "time": 194.3
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.9259,
          "tokens": null,
          "time": 122.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.724,
          "tokens": null,
          "time": 118.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.4182,
          "tokens": null,
          "time": 62.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.09,
          "tokens": null,
          "time": 164.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 81.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.828,
          "tokens": null,
          "time": 183.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.0001,
          "tokens": null,
          "time": 65.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 1.4942,
          "tokens": null,
          "time": 92.5
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 3.3633,
          "tokens": null,
          "time": 184.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.7238,
          "tokens": null,
          "time": 75.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.7208,
          "tokens": null,
          "time": 129.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.3513,
          "tokens": null,
          "time": 77.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.7656,
          "tokens": null,
          "time": 90.5
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.7525,
          "tokens": null,
          "time": 93.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.3662,
          "tokens": null,
          "time": 101.0
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": true,
          "cost": 4.4553,
          "tokens": null,
          "time": 264.4
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 12.7
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 169.9
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 1.1227,
          "tokens": null,
          "time": 129.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 4.5597,
          "tokens": null,
          "time": 157.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 1.7408,
          "tokens": null,
          "time": 123.9
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 59.7
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.1587,
          "tokens": null,
          "time": 96.3
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 1.8328,
          "tokens": null,
          "time": 158.5
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 2.8442,
          "tokens": null,
          "time": 201.9
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 1.6269,
          "tokens": null,
          "time": 161.9
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.2951,
          "tokens": null,
          "time": 74.3
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 1.249,
          "tokens": null,
          "time": 132.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 3.2846,
          "tokens": null,
          "time": 152.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 143.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 24.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 3.7621,
          "tokens": null,
          "time": 200.1
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 1.3261,
          "tokens": null,
          "time": 125.7
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.806,
          "tokens": null,
          "time": 126.5
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 1.5638,
          "tokens": null,
          "time": 201.0
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 2.5595,
          "tokens": null,
          "time": 213.2
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 2.0134,
          "tokens": null,
          "time": 155.6
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.6233,
          "tokens": null,
          "time": 93.9
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 58.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.4847,
          "tokens": null,
          "time": 139.3
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.7527,
          "tokens": null,
          "time": 70.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.485,
          "tokens": null,
          "time": 74.9
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 3.1581,
          "tokens": null,
          "time": 125.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.8478,
          "tokens": null,
          "time": 104.7
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 1.4379,
          "tokens": null,
          "time": 85.1
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 1.9266,
          "tokens": null,
          "time": 89.5
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.5821,
          "tokens": null,
          "time": 88.7
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 1.0788,
          "tokens": null,
          "time": 151.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": true,
          "cost": 1.6585,
          "tokens": null,
          "time": 97.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 2.2045,
          "tokens": null,
          "time": 192.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.9466,
          "tokens": null,
          "time": 157.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 104.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 1.0585,
          "tokens": null,
          "time": 119.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 1.8927,
          "tokens": null,
          "time": 106.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.0001,
          "tokens": null,
          "time": 94.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 1.0426,
          "tokens": null,
          "time": 121.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.3637,
          "tokens": null,
          "time": 58.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 1.3804,
          "tokens": null,
          "time": 94.7
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 1.3854,
          "tokens": null,
          "time": 111.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 62.9
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 2.071,
          "tokens": null,
          "time": 142.2
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.989,
          "tokens": null,
          "time": 192.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.1256,
          "tokens": null,
          "time": 90.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 2.6215,
          "tokens": null,
          "time": 122.7
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 2.3128,
          "tokens": null,
          "time": 126.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 1.4743,
          "tokens": null,
          "time": 108.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 2.2466,
          "tokens": null,
          "time": 113.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.9167,
          "tokens": null,
          "time": 80.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 54.6
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 3.6887,
          "tokens": null,
          "time": 175.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.949,
          "tokens": null,
          "time": 185.2
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 68.4
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.7895,
          "tokens": null,
          "time": 132.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 1.6832,
          "tokens": null,
          "time": 103.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 1.1429,
          "tokens": null,
          "time": 103.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 78.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 1.8696,
          "tokens": null,
          "time": 96.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.8971,
          "tokens": null,
          "time": 92.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 1.4066,
          "tokens": null,
          "time": 123.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": false,
          "cost": 0.9989,
          "tokens": null,
          "time": 91.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 1.7512,
          "tokens": null,
          "time": 108.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.5366,
          "tokens": null,
          "time": 76.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 2.8711,
          "tokens": null,
          "time": 87.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.5459,
          "tokens": null,
          "time": 98.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 3.884,
          "tokens": null,
          "time": 153.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 2.3016,
          "tokens": null,
          "time": 174.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 2.0605,
          "tokens": null,
          "time": 130.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.6733,
          "tokens": null,
          "time": 106.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 2.2298,
          "tokens": null,
          "time": 137.7
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 1.5375,
          "tokens": null,
          "time": 121.7
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.8057,
          "tokens": null,
          "time": 74.8
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.6655,
          "tokens": null,
          "time": 95.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 2.6466,
          "tokens": null,
          "time": 123.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 1.0204,
          "tokens": null,
          "time": 79.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 81.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 3.1951,
          "tokens": null,
          "time": 157.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 1.8302,
          "tokens": null,
          "time": 131.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 1.7816,
          "tokens": null,
          "time": 95.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.3612,
          "tokens": null,
          "time": 122.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 55.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 70.1
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 2.4782,
          "tokens": null,
          "time": 146.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 5.6814,
          "tokens": null,
          "time": 164.8
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 0.8701,
          "tokens": null,
          "time": 76.2
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 2.109,
          "tokens": null,
          "time": 137.4
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 61.9
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 2.3561,
          "tokens": null,
          "time": 111.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 1.6379,
          "tokens": null,
          "time": 152.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.9272,
          "tokens": null,
          "time": 81.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 1.1956,
          "tokens": null,
          "time": 122.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.6471,
          "tokens": null,
          "time": 72.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.826,
          "tokens": null,
          "time": 87.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.7755,
          "tokens": null,
          "time": 85.9
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 1.5652,
          "tokens": null,
          "time": 90.2
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 1.3472,
          "tokens": null,
          "time": 108.8
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 2.1627,
          "tokens": null,
          "time": 103.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 1.273,
          "tokens": null,
          "time": 118.3
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.2948,
          "tokens": null,
          "time": 75.3
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 2.0838,
          "tokens": null,
          "time": 186.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 2.3228,
          "tokens": null,
          "time": 111.7
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.9497,
          "tokens": null,
          "time": 103.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.478,
          "tokens": null,
          "time": 177.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.5367,
          "tokens": null,
          "time": 116.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 3.0801,
          "tokens": null,
          "time": 133.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.7253,
          "tokens": null,
          "time": 101.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0001,
          "tokens": null,
          "time": 74.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 1.3615,
          "tokens": null,
          "time": 106.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.4332,
          "tokens": null,
          "time": 96.0
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": true,
          "cost": 1.4187,
          "tokens": null,
          "time": 186.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 3.1208,
          "tokens": null,
          "time": 176.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.3421,
          "tokens": null,
          "time": 68.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.7803,
          "tokens": null,
          "time": 134.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 1.2554,
          "tokens": null,
          "time": 116.0
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 2.4964,
          "tokens": null,
          "time": 142.6
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 1.8479,
          "tokens": null,
          "time": 155.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.1043,
          "tokens": null,
          "time": 70.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.2296,
          "tokens": null,
          "time": 82.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.5569,
          "tokens": null,
          "time": 83.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.7092,
          "tokens": null,
          "time": 114.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 1.4007,
          "tokens": null,
          "time": 136.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.8837,
          "tokens": null,
          "time": 99.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 2.3403,
          "tokens": null,
          "time": 148.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 3.9337,
          "tokens": null,
          "time": 236.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.9422,
          "tokens": null,
          "time": 131.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 1.073,
          "tokens": null,
          "time": 82.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 2.0523,
          "tokens": null,
          "time": 206.9
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.5888,
          "tokens": null,
          "time": 167.6
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 3.8057,
          "tokens": null,
          "time": 163.7
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 1.4892,
          "tokens": null,
          "time": 139.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 10.7686,
          "tokens": null,
          "time": 410.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 2.1739,
          "tokens": null,
          "time": 145.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 5.1449,
          "tokens": null,
          "time": 222.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 3.9634,
          "tokens": null,
          "time": 213.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.847,
          "tokens": null,
          "time": 143.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 2.0792,
          "tokens": null,
          "time": 175.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 3.0044,
          "tokens": null,
          "time": 161.4
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 3.2011,
          "tokens": null,
          "time": 178.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 2.967,
          "tokens": null,
          "time": 119.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 2.5398,
          "tokens": null,
          "time": 114.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 1.2951,
          "tokens": null,
          "time": 206.4
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 1.4478,
          "tokens": null,
          "time": 105.8
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 2.4247,
          "tokens": null,
          "time": 115.3
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.8927,
          "tokens": null,
          "time": 86.0
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 1.2814,
          "tokens": null,
          "time": 74.7
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 2.0155,
          "tokens": null,
          "time": 117.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 4.7491,
          "tokens": null,
          "time": 165.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 1.0321,
          "tokens": null,
          "time": 113.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 2.4258,
          "tokens": null,
          "time": 161.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.6608,
          "tokens": null,
          "time": 83.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.776,
          "tokens": null,
          "time": 80.9
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 1.2717,
          "tokens": null,
          "time": 93.9
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 1.1247,
          "tokens": null,
          "time": 105.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.6652,
          "tokens": null,
          "time": 98.4
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 2.9075,
          "tokens": null,
          "time": 120.6
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 1.1224,
          "tokens": null,
          "time": 123.4
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.7064,
          "tokens": null,
          "time": 99.4
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 2.5444,
          "tokens": null,
          "time": 182.7
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 2.6948,
          "tokens": null,
          "time": 159.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 4.7804,
          "tokens": null,
          "time": 239.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 1.0181,
          "tokens": null,
          "time": 106.3
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.7321,
          "tokens": null,
          "time": 86.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 0.9565,
          "tokens": null,
          "time": 105.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 1.1604,
          "tokens": null,
          "time": 103.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.7968,
          "tokens": null,
          "time": 96.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.0595,
          "tokens": null,
          "time": 65.3
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 2.8707,
          "tokens": null,
          "time": 184.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 1.1311,
          "tokens": null,
          "time": 133.7
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.4056,
          "tokens": null,
          "time": 77.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 2.5371,
          "tokens": null,
          "time": 171.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.3287,
          "tokens": null,
          "time": 93.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": true,
          "cost": 1.1345,
          "tokens": null,
          "time": 132.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 2.5369,
          "tokens": null,
          "time": 183.3
        }
      ]
    },
    {
      "runKey": "hermes-opus-4.8",
      "harness": "hermes",
      "model": "claude-opus-4.8",
      "modelName": "claude-opus-4.8",
      "reported": {
        "cost": 1.095,
        "tokens": 207000,
        "time": 147,
        "tokensEstimated": true
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.6135,
          "tokens": null,
          "time": 114.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 1.0583,
          "tokens": null,
          "time": 100.3
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.9902,
          "tokens": null,
          "time": 195.1
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.0495,
          "tokens": null,
          "time": 167.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": true,
          "cost": 1.2328,
          "tokens": null,
          "time": 144.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.7,
          "tokens": null,
          "time": 138.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 1.1082,
          "tokens": null,
          "time": 150.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.8009,
          "tokens": null,
          "time": 144.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 1.17,
          "tokens": null,
          "time": 150.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.8264,
          "tokens": null,
          "time": 113.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.5936,
          "tokens": null,
          "time": 131.3
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 1.3301,
          "tokens": null,
          "time": 154.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 1.053,
          "tokens": null,
          "time": 121.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.7742,
          "tokens": null,
          "time": 127.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": true,
          "cost": 1.1485,
          "tokens": null,
          "time": 137.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.9527,
          "tokens": null,
          "time": 132.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": true,
          "cost": 0.7743,
          "tokens": null,
          "time": 123.0
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 1.5332,
          "tokens": null,
          "time": 169.4
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.716,
          "tokens": null,
          "time": 109.1
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.6484,
          "tokens": null,
          "time": 115.9
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.5901,
          "tokens": null,
          "time": 263.7
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.7872,
          "tokens": null,
          "time": 148.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 1.9349,
          "tokens": null,
          "time": 205.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.7583,
          "tokens": null,
          "time": 129.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 1.2706,
          "tokens": null,
          "time": 153.0
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 1.4762,
          "tokens": null,
          "time": 176.6
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 1.1017,
          "tokens": null,
          "time": 127.3
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.4534,
          "tokens": null,
          "time": 108.0
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 1.667,
          "tokens": null,
          "time": 169.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 1.3382,
          "tokens": null,
          "time": 120.5
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.9377,
          "tokens": null,
          "time": 181.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 2.6081,
          "tokens": null,
          "time": 167.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 1.514,
          "tokens": null,
          "time": 204.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 1.5006,
          "tokens": null,
          "time": 130.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.9418,
          "tokens": null,
          "time": 158.9
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.9719,
          "tokens": null,
          "time": 109.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.2444,
          "tokens": null,
          "time": 147.6
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 1.8902,
          "tokens": null,
          "time": 235.6
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 2.3713,
          "tokens": null,
          "time": 238.4
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.945,
          "tokens": null,
          "time": 185.4
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.8798,
          "tokens": null,
          "time": 133.2
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.9434,
          "tokens": null,
          "time": 146.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.8607,
          "tokens": null,
          "time": 142.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 1.5023,
          "tokens": null,
          "time": 152.2
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.7848,
          "tokens": null,
          "time": 113.5
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 2.1201,
          "tokens": null,
          "time": 248.6
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.7245,
          "tokens": null,
          "time": 151.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 1.1885,
          "tokens": null,
          "time": 105.7
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 2.6988,
          "tokens": null,
          "time": 189.4
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.9717,
          "tokens": null,
          "time": 178.1
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 1.1394,
          "tokens": null,
          "time": 159.5
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": true,
          "cost": 1.8212,
          "tokens": null,
          "time": 195.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.9672,
          "tokens": null,
          "time": 160.4
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 1.4906,
          "tokens": null,
          "time": 217.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 1.4804,
          "tokens": null,
          "time": 159.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 1.1454,
          "tokens": null,
          "time": 184.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.8386,
          "tokens": null,
          "time": 89.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.9234,
          "tokens": null,
          "time": 152.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 1.4248,
          "tokens": null,
          "time": 155.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.8459,
          "tokens": null,
          "time": 130.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.8595,
          "tokens": null,
          "time": 114.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.7384,
          "tokens": null,
          "time": 120.2
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.5725,
          "tokens": null,
          "time": 111.4
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.8339,
          "tokens": null,
          "time": 118.9
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.453,
          "tokens": null,
          "time": 227.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 1.564,
          "tokens": null,
          "time": 149.7
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 2.9834,
          "tokens": null,
          "time": 248.6
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.3985,
          "tokens": null,
          "time": 161.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.7162,
          "tokens": null,
          "time": 138.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 1.0691,
          "tokens": null,
          "time": 113.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 1.658,
          "tokens": null,
          "time": 154.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 2.0937,
          "tokens": null,
          "time": 254.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 1.1681,
          "tokens": null,
          "time": 143.7
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": true,
          "cost": 1.383,
          "tokens": null,
          "time": 155.1
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.728,
          "tokens": null,
          "time": 160.2
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.5714,
          "tokens": null,
          "time": 141.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.9803,
          "tokens": null,
          "time": 124.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.8175,
          "tokens": null,
          "time": 125.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.9707,
          "tokens": null,
          "time": 98.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 1.1107,
          "tokens": null,
          "time": 140.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.7041,
          "tokens": null,
          "time": 111.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 1.7507,
          "tokens": null,
          "time": 162.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 1.1308,
          "tokens": null,
          "time": 122.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.53,
          "tokens": null,
          "time": 124.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.592,
          "tokens": null,
          "time": 120.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.6798,
          "tokens": null,
          "time": 123.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 1.4326,
          "tokens": null,
          "time": 184.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.6386,
          "tokens": null,
          "time": 157.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 1.4594,
          "tokens": null,
          "time": 176.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 1.4499,
          "tokens": null,
          "time": 142.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 1.2171,
          "tokens": null,
          "time": 150.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.905,
          "tokens": null,
          "time": 146.4
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": false,
          "cost": 0.644,
          "tokens": null,
          "time": 102.9
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": false,
          "cost": 0.7765,
          "tokens": null,
          "time": 114.0
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 0.9558,
          "tokens": null,
          "time": 124.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 1.2684,
          "tokens": null,
          "time": 135.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 1.3043,
          "tokens": null,
          "time": 129.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 1.633,
          "tokens": null,
          "time": 132.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.8521,
          "tokens": null,
          "time": 134.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 1.2047,
          "tokens": null,
          "time": 172.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 2.0861,
          "tokens": null,
          "time": 117.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.5994,
          "tokens": null,
          "time": 216.8
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 0.4217,
          "tokens": null,
          "time": 126.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 1.2156,
          "tokens": null,
          "time": 116.7
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 1.648,
          "tokens": null,
          "time": 149.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 2.1752,
          "tokens": null,
          "time": 199.7
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": true,
          "cost": 1.9235,
          "tokens": null,
          "time": 140.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.8786,
          "tokens": null,
          "time": 195.0
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": false,
          "cost": 1.1544,
          "tokens": null,
          "time": 153.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.8124,
          "tokens": null,
          "time": 138.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 1.4495,
          "tokens": null,
          "time": 137.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 1.0774,
          "tokens": null,
          "time": 153.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.8011,
          "tokens": null,
          "time": 141.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.5498,
          "tokens": null,
          "time": 92.1
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 1.0181,
          "tokens": null,
          "time": 125.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 1.0165,
          "tokens": null,
          "time": 125.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.5737,
          "tokens": null,
          "time": 120.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.8066,
          "tokens": null,
          "time": 182.9
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.79,
          "tokens": null,
          "time": 119.1
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.575,
          "tokens": null,
          "time": 126.1
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 1.0233,
          "tokens": null,
          "time": 178.3
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.6106,
          "tokens": null,
          "time": 124.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 4.4909,
          "tokens": null,
          "time": 225.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.9919,
          "tokens": null,
          "time": 109.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.9008,
          "tokens": null,
          "time": 85.9
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.7668,
          "tokens": null,
          "time": 190.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": true,
          "cost": 0.767,
          "tokens": null,
          "time": 176.6
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 1.39,
          "tokens": null,
          "time": 171.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.9693,
          "tokens": null,
          "time": 113.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": true,
          "cost": 0.8426,
          "tokens": null,
          "time": 123.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 1.0408,
          "tokens": null,
          "time": 127.4
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.649,
          "tokens": null,
          "time": 90.7
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.7961,
          "tokens": null,
          "time": 98.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 1.0347,
          "tokens": null,
          "time": 136.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": true,
          "cost": 1.2717,
          "tokens": null,
          "time": 146.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.7593,
          "tokens": null,
          "time": 179.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 1.7668,
          "tokens": null,
          "time": 184.1
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 1.1489,
          "tokens": null,
          "time": 160.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.8673,
          "tokens": null,
          "time": 117.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 1.3056,
          "tokens": null,
          "time": 164.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.6195,
          "tokens": null,
          "time": 94.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.7686,
          "tokens": null,
          "time": 100.6
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.8929,
          "tokens": null,
          "time": 126.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 1.212,
          "tokens": null,
          "time": 150.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.5933,
          "tokens": null,
          "time": 141.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 2.5467,
          "tokens": null,
          "time": 264.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 1.3485,
          "tokens": null,
          "time": 243.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.7778,
          "tokens": null,
          "time": 137.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 1.1529,
          "tokens": null,
          "time": 159.4
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 1.3661,
          "tokens": null,
          "time": 193.8
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 0.6983,
          "tokens": null,
          "time": 128.3
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.5985,
          "tokens": null,
          "time": 143.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.7112,
          "tokens": null,
          "time": 184.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 1.097,
          "tokens": null,
          "time": 134.5
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.7551,
          "tokens": null,
          "time": 160.6
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.9007,
          "tokens": null,
          "time": 112.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 1.0069,
          "tokens": null,
          "time": 178.3
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.933,
          "tokens": null,
          "time": 139.6
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.5584,
          "tokens": null,
          "time": 162.1
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 1.3641,
          "tokens": null,
          "time": 149.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.8117,
          "tokens": null,
          "time": 144.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.6462,
          "tokens": null,
          "time": 141.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.5984,
          "tokens": null,
          "time": 130.5
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.6988,
          "tokens": null,
          "time": 135.4
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.7616,
          "tokens": null,
          "time": 121.9
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.6314,
          "tokens": null,
          "time": 125.4
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.8492,
          "tokens": null,
          "time": 109.4
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 1.1781,
          "tokens": null,
          "time": 152.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 0.511,
          "tokens": null,
          "time": 116.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.5017,
          "tokens": null,
          "time": 127.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 1.0516,
          "tokens": null,
          "time": 143.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.843,
          "tokens": null,
          "time": 136.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.8292,
          "tokens": null,
          "time": 127.3
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.6814,
          "tokens": null,
          "time": 169.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.6263,
          "tokens": null,
          "time": 129.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.6637,
          "tokens": null,
          "time": 108.1
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.8827,
          "tokens": null,
          "time": 140.7
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": false,
          "cost": 0.9538,
          "tokens": null,
          "time": 137.5
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 1.2015,
          "tokens": null,
          "time": 143.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 1.1871,
          "tokens": null,
          "time": 119.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.8278,
          "tokens": null,
          "time": 152.4
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.9389,
          "tokens": null,
          "time": 147.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.9565,
          "tokens": null,
          "time": 131.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": true,
          "cost": 0.8283,
          "tokens": null,
          "time": 124.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 1.1656,
          "tokens": null,
          "time": 164.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.5227,
          "tokens": null,
          "time": 116.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.6175,
          "tokens": null,
          "time": 118.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.8449,
          "tokens": null,
          "time": 171.9
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 1.3025,
          "tokens": null,
          "time": 145.3
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.8362,
          "tokens": null,
          "time": 158.7
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 1.5752,
          "tokens": null,
          "time": 180.4
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.6223,
          "tokens": null,
          "time": 104.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 1.0268,
          "tokens": null,
          "time": 114.0
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.449,
          "tokens": null,
          "time": 130.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.126,
          "tokens": null,
          "time": 146.8
        }
      ]
    },
    {
      "runKey": "rag-sonnet-4.5",
      "harness": "trace-rag",
      "model": "claude-sonnet-4.5",
      "modelName": "claude-sonnet-4.5",
      "reported": {
        "cost": 0.529,
        "tokens": 169000,
        "time": 155,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.5037,
          "tokens": 162014,
          "time": 99.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.559,
          "tokens": 180636,
          "time": 103.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 1.7064,
          "tokens": 557690,
          "time": 216.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 1.2718,
          "tokens": 414358,
          "time": 130.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.7645,
          "tokens": 245018,
          "time": 184.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.7507,
          "tokens": 240432,
          "time": 184.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 0.8157,
          "tokens": 264189,
          "time": 163.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.5127,
          "tokens": 164227,
          "time": 112.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.4303,
          "tokens": 136522,
          "time": 103.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.3371,
          "tokens": 107797,
          "time": 82.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.2944,
          "tokens": 92925,
          "time": 107.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.9747,
          "tokens": 316501,
          "time": 139.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.5029,
          "tokens": 159326,
          "time": 114.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.4941,
          "tokens": 156208,
          "time": 196.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.6306,
          "tokens": 202938,
          "time": 105.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.6245,
          "tokens": 199356,
          "time": 122.3
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.3626,
          "tokens": 113518,
          "time": 300.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.2089,
          "tokens": 64000,
          "time": 140.1
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.35,
          "tokens": 111956,
          "time": 238.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.3773,
          "tokens": 120618,
          "time": 297.3
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.6448,
          "tokens": 207796,
          "time": 184.5
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 1.0236,
          "tokens": 326546,
          "time": 297.0
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.5516,
          "tokens": 176220,
          "time": 228.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.5042,
          "tokens": 162461,
          "time": 205.5
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.8058,
          "tokens": 261283,
          "time": 266.2
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.6835,
          "tokens": 218108,
          "time": 308.0
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.2355,
          "tokens": 73116,
          "time": 326.4
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.2786,
          "tokens": 87554,
          "time": 325.9
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.7522,
          "tokens": 238537,
          "time": 308.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.2785,
          "tokens": 86739,
          "time": 184.8
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.2867,
          "tokens": 88746,
          "time": 181.3
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.4715,
          "tokens": 151581,
          "time": 248.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 1.2794,
          "tokens": 416358,
          "time": 291.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.6072,
          "tokens": 195656,
          "time": 261.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.6417,
          "tokens": 207690,
          "time": 263.7
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.2205,
          "tokens": 68711,
          "time": 154.2
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.3384,
          "tokens": 106649,
          "time": 156.6
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.4923,
          "tokens": 143897,
          "time": 253.2
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": true,
          "cost": 0.5591,
          "tokens": 160387,
          "time": 334.9
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.9496,
          "tokens": 295543,
          "time": 305.2
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.279,
          "tokens": 86938,
          "time": 156.4
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.4516,
          "tokens": 143257,
          "time": 307.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.2903,
          "tokens": 84842,
          "time": 225.8
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.3359,
          "tokens": 106077,
          "time": 173.2
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.4358,
          "tokens": 138889,
          "time": 222.3
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.3462,
          "tokens": 109821,
          "time": 100.4
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.3372,
          "tokens": 106973,
          "time": 90.2
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.3783,
          "tokens": 119644,
          "time": 121.8
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.8356,
          "tokens": 273333,
          "time": 110.1
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.691,
          "tokens": 221600,
          "time": 192.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.7242,
          "tokens": 233689,
          "time": 119.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.7803,
          "tokens": 254383,
          "time": 172.1
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.438,
          "tokens": 140279,
          "time": 113.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.5833,
          "tokens": 188136,
          "time": 119.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.2625,
          "tokens": 82131,
          "time": 100.5
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.4614,
          "tokens": 146888,
          "time": 126.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.1147,
          "tokens": 34781,
          "time": 97.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 1.0422,
          "tokens": 336593,
          "time": 139.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.655,
          "tokens": 211774,
          "time": 115.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.2272,
          "tokens": 71282,
          "time": 129.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": true,
          "cost": 0.1696,
          "tokens": 51355,
          "time": 130.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": false,
          "cost": 0.1961,
          "tokens": 59956,
          "time": 327.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.5177,
          "tokens": 164137,
          "time": 382.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": true,
          "cost": 0.8355,
          "tokens": 268793,
          "time": 367.9
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.369,
          "tokens": 448965,
          "time": 238.9
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": false,
          "cost": 0.2947,
          "tokens": 92846,
          "time": 336.8
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.5348,
          "tokens": 170715,
          "time": 308.7
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 1.021,
          "tokens": 334824,
          "time": 369.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 1.347,
          "tokens": 443450,
          "time": 357.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.257,
          "tokens": 80339,
          "time": 204.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.9011,
          "tokens": 293237,
          "time": 384.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 1.3922,
          "tokens": 454016,
          "time": 346.0
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.2025,
          "tokens": 62006,
          "time": 225.9
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.4779,
          "tokens": 150673,
          "time": 202.1
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 0.3521,
          "tokens": 110742,
          "time": 183.9
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.8229,
          "tokens": 265743,
          "time": 311.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.4991,
          "tokens": 159931,
          "time": 164.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.6008,
          "tokens": 192674,
          "time": 193.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.3204,
          "tokens": 100265,
          "time": 232.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.1657,
          "tokens": 50523,
          "time": 172.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.2174,
          "tokens": 67495,
          "time": 148.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.8036,
          "tokens": 262039,
          "time": 263.7
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.1678,
          "tokens": 51035,
          "time": 248.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.2575,
          "tokens": 80881,
          "time": 83.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.4861,
          "tokens": 155417,
          "time": 121.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 0.3446,
          "tokens": 109361,
          "time": 139.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.4201,
          "tokens": 133384,
          "time": 107.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.622,
          "tokens": 200688,
          "time": 164.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.3456,
          "tokens": 104708,
          "time": 154.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.1714,
          "tokens": 51187,
          "time": 127.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.2216,
          "tokens": 68599,
          "time": 155.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.2956,
          "tokens": 92781,
          "time": 180.9
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.2343,
          "tokens": 73975,
          "time": 126.9
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.4542,
          "tokens": 146041,
          "time": 167.9
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.2393,
          "tokens": 74382,
          "time": 182.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.4219,
          "tokens": 133099,
          "time": 194.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.1207,
          "tokens": 35522,
          "time": 168.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.5665,
          "tokens": 180627,
          "time": 177.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.5392,
          "tokens": 172746,
          "time": 184.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.4798,
          "tokens": 153731,
          "time": 184.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 1.2475,
          "tokens": 410137,
          "time": 220.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.5335,
          "tokens": 170119,
          "time": 246.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 1.1871,
          "tokens": 389410,
          "time": 228.0
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.9424,
          "tokens": 307745,
          "time": 91.8
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.4389,
          "tokens": 139209,
          "time": 82.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.6031,
          "tokens": 193838,
          "time": 94.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.782,
          "tokens": 255049,
          "time": 193.5
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 1.5656,
          "tokens": 514209,
          "time": 253.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.2151,
          "tokens": 66857,
          "time": 226.7
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": true,
          "cost": 0.2954,
          "tokens": 92461,
          "time": 230.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.4428,
          "tokens": 142780,
          "time": 161.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.4368,
          "tokens": 139127,
          "time": 187.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": true,
          "cost": 0.8104,
          "tokens": 262429,
          "time": 181.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.2255,
          "tokens": 70455,
          "time": 144.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.2669,
          "tokens": 83086,
          "time": 161.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.4322,
          "tokens": 137121,
          "time": 166.6
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.7972,
          "tokens": 258829,
          "time": 159.2
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 1.2985,
          "tokens": 423470,
          "time": 93.6
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.2363,
          "tokens": 73060,
          "time": 154.3
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": false,
          "cost": 0.4449,
          "tokens": 142941,
          "time": 155.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": true,
          "cost": 0.2295,
          "tokens": 71392,
          "time": 128.1
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.4847,
          "tokens": 155572,
          "time": 69.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.5083,
          "tokens": 163487,
          "time": 137.4
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.2081,
          "tokens": 65078,
          "time": 137.1
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.1513,
          "tokens": 46153,
          "time": 137.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.4489,
          "tokens": 143857,
          "time": 147.8
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.6631,
          "tokens": 214927,
          "time": 72.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 0.293,
          "tokens": 92602,
          "time": 147.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.1645,
          "tokens": 50591,
          "time": 52.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": true,
          "cost": 0.2615,
          "tokens": 81718,
          "time": 163.9
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.5535,
          "tokens": 176871,
          "time": 181.7
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.234,
          "tokens": 73812,
          "time": 147.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.3392,
          "tokens": 106641,
          "time": 146.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.1809,
          "tokens": 55454,
          "time": 57.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.2476,
          "tokens": 76813,
          "time": 146.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.2502,
          "tokens": 78731,
          "time": 133.6
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.2859,
          "tokens": 89416,
          "time": 132.5
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.4479,
          "tokens": 142682,
          "time": 61.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.2213,
          "tokens": 69124,
          "time": 59.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.3225,
          "tokens": 101962,
          "time": 59.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.2353,
          "tokens": 73457,
          "time": 119.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.5894,
          "tokens": 185910,
          "time": 159.7
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.5124,
          "tokens": 163996,
          "time": 140.4
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.3242,
          "tokens": 102964,
          "time": 119.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.3295,
          "tokens": 104723,
          "time": 59.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.8535,
          "tokens": 276564,
          "time": 99.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.6334,
          "tokens": 205730,
          "time": 87.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.7539,
          "tokens": 243470,
          "time": 97.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 1.0968,
          "tokens": 352436,
          "time": 125.5
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.3782,
          "tokens": 112424,
          "time": 116.5
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.9977,
          "tokens": 325095,
          "time": 96.9
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.3369,
          "tokens": 105969,
          "time": 85.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.8699,
          "tokens": 282567,
          "time": 93.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.453,
          "tokens": 143544,
          "time": 103.1
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.2022,
          "tokens": 392022,
          "time": 106.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.7693,
          "tokens": 250187,
          "time": 87.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": true,
          "cost": 0.8567,
          "tokens": 277975,
          "time": 98.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.4354,
          "tokens": 139691,
          "time": 88.9
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 1.0907,
          "tokens": 353703,
          "time": 118.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.3796,
          "tokens": 121158,
          "time": 69.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": true,
          "cost": 0.8416,
          "tokens": 273332,
          "time": 86.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.7826,
          "tokens": 253917,
          "time": 85.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 1.161,
          "tokens": 372696,
          "time": 121.9
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.737,
          "tokens": 236079,
          "time": 106.0
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.3745,
          "tokens": 119302,
          "time": 73.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.6119,
          "tokens": 195001,
          "time": 82.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.1786,
          "tokens": 55113,
          "time": 59.9
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.6431,
          "tokens": 206694,
          "time": 84.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 1.1935,
          "tokens": 387723,
          "time": 114.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.1641,
          "tokens": 50905,
          "time": 68.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.4107,
          "tokens": 129656,
          "time": 75.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1322,
          "tokens": 39320,
          "time": 58.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.3308,
          "tokens": 103488,
          "time": 70.9
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.3126,
          "tokens": 98584,
          "time": 69.5
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": true,
          "cost": 0.7296,
          "tokens": 235417,
          "time": 86.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.2591,
          "tokens": 80676,
          "time": 58.9
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.1612,
          "tokens": 49533,
          "time": 47.0
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.3244,
          "tokens": 102454,
          "time": 57.1
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.6033,
          "tokens": 195112,
          "time": 58.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.5577,
          "tokens": 176633,
          "time": 79.8
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.5824,
          "tokens": 185401,
          "time": 79.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.7252,
          "tokens": 232137,
          "time": 88.7
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.8327,
          "tokens": 269252,
          "time": 83.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.264,
          "tokens": 83306,
          "time": 58.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.2414,
          "tokens": 74947,
          "time": 73.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.2218,
          "tokens": 69198,
          "time": 61.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.2872,
          "tokens": 89324,
          "time": 64.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.2114,
          "tokens": 65067,
          "time": 56.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.7952,
          "tokens": 257389,
          "time": 84.0
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.5336,
          "tokens": 171224,
          "time": 63.1
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.2294,
          "tokens": 70516,
          "time": 63.2
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.5264,
          "tokens": 168727,
          "time": 65.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.3098,
          "tokens": 98218,
          "time": 58.8
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.3038,
          "tokens": 95399,
          "time": 65.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.4206,
          "tokens": 133478,
          "time": 61.1
        }
      ]
    },
    {
      "runKey": "rag-haiku-4.5",
      "harness": "trace-rag",
      "model": "claude-haiku-4.5",
      "modelName": "claude-haiku-4.5",
      "reported": {
        "cost": 0.189,
        "tokens": 181000,
        "time": 135,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.1648,
          "tokens": 157772,
          "time": 99.8
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.0857,
          "tokens": 80467,
          "time": 77.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.2552,
          "tokens": 247627,
          "time": 72.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.0921,
          "tokens": 85990,
          "time": 62.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.313,
          "tokens": 304108,
          "time": 113.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.2352,
          "tokens": 223506,
          "time": 204.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.2801,
          "tokens": 271494,
          "time": 169.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.1632,
          "tokens": 156857,
          "time": 102.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.1556,
          "tokens": 146686,
          "time": 131.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 0.2725,
          "tokens": 265908,
          "time": 71.5
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": true,
          "cost": 0.0913,
          "tokens": 86087,
          "time": 80.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.2043,
          "tokens": 192119,
          "time": 98.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.2538,
          "tokens": 245318,
          "time": 102.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.1166,
          "tokens": 110635,
          "time": 74.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.0909,
          "tokens": 85139,
          "time": 61.5
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.2783,
          "tokens": 270152,
          "time": 66.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.1606,
          "tokens": 153006,
          "time": 300.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.1149,
          "tokens": 109140,
          "time": 209.2
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.3408,
          "tokens": 333543,
          "time": 219.6
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.6888,
          "tokens": 679022,
          "time": 352.3
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.2952,
          "tokens": 285425,
          "time": 220.7
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.2375,
          "tokens": 224020,
          "time": 218.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.0948,
          "tokens": 88243,
          "time": 150.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.0994,
          "tokens": 93585,
          "time": 200.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.4285,
          "tokens": 414982,
          "time": 250.9
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.1038,
          "tokens": 94952,
          "time": 302.5
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.0804,
          "tokens": 74979,
          "time": 283.2
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.0797,
          "tokens": 74556,
          "time": 274.7
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.1571,
          "tokens": 145775,
          "time": 230.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.0807,
          "tokens": 75178,
          "time": 120.4
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.1124,
          "tokens": 105226,
          "time": 304.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": true,
          "cost": 0.2433,
          "tokens": 235999,
          "time": 196.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.2804,
          "tokens": 266574,
          "time": 201.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.2934,
          "tokens": 283206,
          "time": 238.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.2143,
          "tokens": 205236,
          "time": 242.1
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.1042,
          "tokens": 98303,
          "time": 149.8
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.4036,
          "tokens": 388270,
          "time": 266.2
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.2025,
          "tokens": 182868,
          "time": 247.1
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.2089,
          "tokens": 189105,
          "time": 248.6
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.2693,
          "tokens": 237961,
          "time": 223.7
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.1696,
          "tokens": 161626,
          "time": 202.1
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.1149,
          "tokens": 108154,
          "time": 193.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.0871,
          "tokens": 76726,
          "time": 168.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.1179,
          "tokens": 111136,
          "time": 218.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.0837,
          "tokens": 78507,
          "time": 201.7
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.1534,
          "tokens": 146603,
          "time": 69.3
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.1171,
          "tokens": 111925,
          "time": 81.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.0997,
          "tokens": 94184,
          "time": 175.4
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.5109,
          "tokens": 502704,
          "time": 109.5
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.2339,
          "tokens": 226789,
          "time": 87.9
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.1344,
          "tokens": 126741,
          "time": 191.5
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.3431,
          "tokens": 336059,
          "time": 97.2
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.1874,
          "tokens": 179609,
          "time": 110.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": true,
          "cost": 0.2928,
          "tokens": 284266,
          "time": 93.1
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.1281,
          "tokens": 121866,
          "time": 71.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.1182,
          "tokens": 112898,
          "time": 60.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.0748,
          "tokens": 70737,
          "time": 73.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.0985,
          "tokens": 92146,
          "time": 91.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.13,
          "tokens": 122541,
          "time": 75.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.0776,
          "tokens": 72527,
          "time": 104.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.1467,
          "tokens": 138927,
          "time": 95.4
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.1731,
          "tokens": 165745,
          "time": 238.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.4264,
          "tokens": 412906,
          "time": 249.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.1952,
          "tokens": 186426,
          "time": 332.0
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.353,
          "tokens": 343183,
          "time": 273.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.1186,
          "tokens": 113390,
          "time": 247.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": true,
          "cost": 0.2546,
          "tokens": 245100,
          "time": 344.4
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.4616,
          "tokens": 453100,
          "time": 252.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 0.4665,
          "tokens": 459815,
          "time": 248.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.1787,
          "tokens": 170952,
          "time": 232.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.1962,
          "tokens": 190647,
          "time": 133.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.2584,
          "tokens": 247130,
          "time": 202.9
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.0749,
          "tokens": 69855,
          "time": 203.4
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.1321,
          "tokens": 126150,
          "time": 261.5
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": true,
          "cost": 0.1425,
          "tokens": 134696,
          "time": 116.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.23,
          "tokens": 221600,
          "time": 218.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.1708,
          "tokens": 163916,
          "time": 210.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.0866,
          "tokens": 80054,
          "time": 150.8
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.1076,
          "tokens": 101151,
          "time": 196.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.113,
          "tokens": 108292,
          "time": 213.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.1217,
          "tokens": 116405,
          "time": 230.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.4489,
          "tokens": 441754,
          "time": 249.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.1439,
          "tokens": 137715,
          "time": 247.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.2421,
          "tokens": 235634,
          "time": 153.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.1433,
          "tokens": 136264,
          "time": 85.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.1281,
          "tokens": 121784,
          "time": 87.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.2993,
          "tokens": 292750,
          "time": 85.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.2015,
          "tokens": 193614,
          "time": 94.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": true,
          "cost": 0.1971,
          "tokens": 184258,
          "time": 103.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.1188,
          "tokens": 109605,
          "time": 114.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": true,
          "cost": 0.0872,
          "tokens": 79442,
          "time": 211.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.0868,
          "tokens": 80599,
          "time": 147.3
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.0875,
          "tokens": 82975,
          "time": 128.9
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.0875,
          "tokens": 82162,
          "time": 154.1
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.278,
          "tokens": 270986,
          "time": 165.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 0.1861,
          "tokens": 178715,
          "time": 129.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.1197,
          "tokens": 114060,
          "time": 148.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.2348,
          "tokens": 226626,
          "time": 159.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": true,
          "cost": 0.2068,
          "tokens": 198150,
          "time": 157.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.164,
          "tokens": 157719,
          "time": 150.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 0.2817,
          "tokens": 275995,
          "time": 216.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.2136,
          "tokens": 205542,
          "time": 219.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 0.3577,
          "tokens": 350246,
          "time": 213.5
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.1845,
          "tokens": 177673,
          "time": 206.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.0857,
          "tokens": 80615,
          "time": 185.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.1808,
          "tokens": 172881,
          "time": 229.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.077,
          "tokens": 71604,
          "time": 202.1
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.258,
          "tokens": 249962,
          "time": 227.0
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.1149,
          "tokens": 108104,
          "time": 188.4
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.0841,
          "tokens": 77493,
          "time": 202.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.1054,
          "tokens": 100064,
          "time": 115.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.0756,
          "tokens": 70412,
          "time": 102.5
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.09,
          "tokens": 84247,
          "time": 109.5
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.1185,
          "tokens": 113493,
          "time": 162.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.2257,
          "tokens": 218409,
          "time": 173.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.1983,
          "tokens": 192379,
          "time": 124.9
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.2087,
          "tokens": 200356,
          "time": 170.9
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.2582,
          "tokens": 251077,
          "time": 172.0
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.0954,
          "tokens": 90753,
          "time": 138.5
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.1731,
          "tokens": 166879,
          "time": 95.9
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.0909,
          "tokens": 85683,
          "time": 93.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.071,
          "tokens": 66059,
          "time": 112.3
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.177,
          "tokens": 170427,
          "time": 99.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.0707,
          "tokens": 65831,
          "time": 103.1
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.1245,
          "tokens": 118401,
          "time": 97.0
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.0937,
          "tokens": 87937,
          "time": 72.3
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.1683,
          "tokens": 161438,
          "time": 90.1
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 0.1781,
          "tokens": 172444,
          "time": 112.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0904,
          "tokens": 85184,
          "time": 108.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.091,
          "tokens": 86549,
          "time": 100.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.485,
          "tokens": 474846,
          "time": 130.3
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.1612,
          "tokens": 156363,
          "time": 100.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.0756,
          "tokens": 70102,
          "time": 81.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.058,
          "tokens": 53683,
          "time": 84.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.2757,
          "tokens": 266674,
          "time": 107.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.0756,
          "tokens": 70907,
          "time": 79.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.1174,
          "tokens": 110763,
          "time": 91.3
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.0792,
          "tokens": 73401,
          "time": 81.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.0969,
          "tokens": 91622,
          "time": 78.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.304,
          "tokens": 296998,
          "time": 81.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.1422,
          "tokens": 136038,
          "time": 67.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": false,
          "cost": 0.0775,
          "tokens": 71726,
          "time": 64.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.2855,
          "tokens": 277667,
          "time": 89.3
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.2431,
          "tokens": 236039,
          "time": 82.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.1838,
          "tokens": 177141,
          "time": 75.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.2781,
          "tokens": 267812,
          "time": 86.7
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.2599,
          "tokens": 252945,
          "time": 89.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.5339,
          "tokens": 525475,
          "time": 116.8
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.1959,
          "tokens": 184884,
          "time": 103.6
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.2275,
          "tokens": 214139,
          "time": 119.1
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.3426,
          "tokens": 334204,
          "time": 113.8
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.1665,
          "tokens": 159324,
          "time": 93.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": true,
          "cost": 0.2186,
          "tokens": 212677,
          "time": 78.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": true,
          "cost": 0.1416,
          "tokens": 136286,
          "time": 82.3
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.3435,
          "tokens": 335220,
          "time": 125.6
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.3145,
          "tokens": 308230,
          "time": 79.4
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.18,
          "tokens": 172703,
          "time": 74.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.1416,
          "tokens": 134886,
          "time": 75.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.2275,
          "tokens": 220146,
          "time": 82.0
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": true,
          "cost": 0.139,
          "tokens": 132040,
          "time": 76.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.3023,
          "tokens": 294310,
          "time": 85.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.0906,
          "tokens": 84420,
          "time": 81.2
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.3583,
          "tokens": 346798,
          "time": 103.5
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.0915,
          "tokens": 87051,
          "time": 60.8
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.0887,
          "tokens": 84077,
          "time": 60.4
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.3221,
          "tokens": 314244,
          "time": 96.2
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.2318,
          "tokens": 223048,
          "time": 73.8
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 0.0912,
          "tokens": 86208,
          "time": 69.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.5607,
          "tokens": 546242,
          "time": 106.0
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.1316,
          "tokens": 126867,
          "time": 69.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.0895,
          "tokens": 84147,
          "time": 60.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.0999,
          "tokens": 92348,
          "time": 73.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.3734,
          "tokens": 363115,
          "time": 91.6
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.1696,
          "tokens": 160714,
          "time": 66.8
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.2085,
          "tokens": 201479,
          "time": 64.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.1241,
          "tokens": 119194,
          "time": 53.1
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.0918,
          "tokens": 86903,
          "time": 49.6
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.1722,
          "tokens": 166732,
          "time": 48.3
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.1421,
          "tokens": 134693,
          "time": 53.5
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.3264,
          "tokens": 314074,
          "time": 92.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.2067,
          "tokens": 200114,
          "time": 58.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.1948,
          "tokens": 187542,
          "time": 45.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.1144,
          "tokens": 108481,
          "time": 37.7
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.089,
          "tokens": 83705,
          "time": 34.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.1655,
          "tokens": 156957,
          "time": 49.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.0836,
          "tokens": 77724,
          "time": 34.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.1257,
          "tokens": 113685,
          "time": 51.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.1129,
          "tokens": 101656,
          "time": 47.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.2942,
          "tokens": 285303,
          "time": 51.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.3474,
          "tokens": 337939,
          "time": 53.1
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.0878,
          "tokens": 81856,
          "time": 29.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.1273,
          "tokens": 121775,
          "time": 32.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.1762,
          "tokens": 169059,
          "time": 35.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.0868,
          "tokens": 80543,
          "time": 30.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.1106,
          "tokens": 103981,
          "time": 34.5
        }
      ]
    },
    {
      "runKey": "claudecode-sonnet-4.5",
      "harness": "claude-code",
      "model": "claude-sonnet-4.5",
      "modelName": "claude-sonnet-4.5",
      "reported": {
        "cost": 0.454,
        "tokens": 907000,
        "time": 130,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.4659,
          "tokens": 912376,
          "time": 101.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.3235,
          "tokens": 632677,
          "time": 73.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": true,
          "cost": 0.6905,
          "tokens": 1416669,
          "time": 148.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.3513,
          "tokens": 603311,
          "time": 65.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.4913,
          "tokens": 835792,
          "time": 119.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.4788,
          "tokens": 860518,
          "time": 91.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.5618,
          "tokens": 914324,
          "time": 114.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.4848,
          "tokens": 969221,
          "time": 109.9
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.853,
          "tokens": 1780727,
          "time": 205.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": true,
          "cost": 0.3951,
          "tokens": 597273,
          "time": 70.5
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.471,
          "tokens": 971056,
          "time": 122.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.3997,
          "tokens": 723673,
          "time": 128.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.3577,
          "tokens": 559441,
          "time": 69.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.278,
          "tokens": 508018,
          "time": 74.7
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.5927,
          "tokens": 1257107,
          "time": 157.1
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.3123,
          "tokens": 535427,
          "time": 81.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.5458,
          "tokens": 1142764,
          "time": 139.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.6324,
          "tokens": 1459470,
          "time": 142.5
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": true,
          "cost": 0.1821,
          "tokens": 338144,
          "time": 45.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.6978,
          "tokens": 1492810,
          "time": 1820.3
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.671,
          "tokens": 1459985,
          "time": 156.4
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.5441,
          "tokens": 1186005,
          "time": 138.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.6015,
          "tokens": 1135305,
          "time": 147.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.4191,
          "tokens": 799760,
          "time": 115.1
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 0.4619,
          "tokens": 919997,
          "time": 112.4
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.4168,
          "tokens": 756773,
          "time": 111.8
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.3705,
          "tokens": 684932,
          "time": 113.0
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.3261,
          "tokens": 637869,
          "time": 100.2
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.8705,
          "tokens": 1832187,
          "time": 264.2
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.4609,
          "tokens": 927002,
          "time": 115.8
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.3801,
          "tokens": 653622,
          "time": 63.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.5763,
          "tokens": 1207012,
          "time": 142.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": true,
          "cost": 0.6849,
          "tokens": 1375414,
          "time": 166.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.2811,
          "tokens": 492854,
          "time": 84.2
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.573,
          "tokens": 1220348,
          "time": 153.7
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.319,
          "tokens": 608952,
          "time": 72.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.4001,
          "tokens": 781485,
          "time": 96.8
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.4083,
          "tokens": 740266,
          "time": 105.1
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.3861,
          "tokens": 622299,
          "time": 137.4
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.6154,
          "tokens": 1151325,
          "time": 254.4
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": true,
          "cost": 0.9408,
          "tokens": 2162601,
          "time": 249.4
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.6949,
          "tokens": 1520106,
          "time": 176.4
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": true,
          "cost": 0.2453,
          "tokens": 373016,
          "time": 59.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 0.3178,
          "tokens": 646850,
          "time": 81.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.3594,
          "tokens": 676692,
          "time": 96.3
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.3771,
          "tokens": 827398,
          "time": 98.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.3914,
          "tokens": 741194,
          "time": 88.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.1796,
          "tokens": 361490,
          "time": 46.7
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.2545,
          "tokens": 505500,
          "time": 68.2
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": true,
          "cost": 0.3836,
          "tokens": 626929,
          "time": 67.3
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": true,
          "cost": 0.5065,
          "tokens": 1020625,
          "time": 140.1
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.3571,
          "tokens": 616550,
          "time": 70.9
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.3835,
          "tokens": 835734,
          "time": 105.0
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.5767,
          "tokens": 1009256,
          "time": 165.1
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.3005,
          "tokens": 509017,
          "time": 61.2
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.361,
          "tokens": 752830,
          "time": 92.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": false,
          "cost": 0.2626,
          "tokens": 577104,
          "time": 66.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.6165,
          "tokens": 1102490,
          "time": 83.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.4378,
          "tokens": 991276,
          "time": 115.0
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": false,
          "cost": 0.3257,
          "tokens": 590390,
          "time": 68.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.1951,
          "tokens": 481277,
          "time": 52.9
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.4532,
          "tokens": 937477,
          "time": 111.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.7198,
          "tokens": 1464018,
          "time": 206.3
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": true,
          "cost": 0.3157,
          "tokens": 606687,
          "time": 115.1
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.4756,
          "tokens": 972431,
          "time": 113.0
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.3425,
          "tokens": 664515,
          "time": 96.1
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.4903,
          "tokens": 1005285,
          "time": 157.4
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.457,
          "tokens": 958778,
          "time": 113.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.4543,
          "tokens": 991467,
          "time": 97.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.343,
          "tokens": 714549,
          "time": 74.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.4059,
          "tokens": 856837,
          "time": 112.7
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.5515,
          "tokens": 990033,
          "time": 154.1
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.1797,
          "tokens": 331181,
          "time": 53.3
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.3184,
          "tokens": 586965,
          "time": 80.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.3675,
          "tokens": 658740,
          "time": 76.6
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.5402,
          "tokens": 771944,
          "time": 104.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.4536,
          "tokens": 883207,
          "time": 128.9
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.4613,
          "tokens": 798450,
          "time": 145.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.5299,
          "tokens": 1080187,
          "time": 140.0
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.1847,
          "tokens": 365928,
          "time": 46.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.2623,
          "tokens": 531265,
          "time": 54.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.3951,
          "tokens": 840490,
          "time": 113.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 0.2346,
          "tokens": 454770,
          "time": 58.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.639,
          "tokens": 1276185,
          "time": 107.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.3666,
          "tokens": 710498,
          "time": 77.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.1926,
          "tokens": 355342,
          "time": 45.5
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.3624,
          "tokens": 747622,
          "time": 98.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.5023,
          "tokens": 1030696,
          "time": 122.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": false,
          "cost": 0.3969,
          "tokens": 718444,
          "time": 101.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 0.7693,
          "tokens": 1616026,
          "time": 199.0
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.5596,
          "tokens": 1098235,
          "time": 131.5
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.5172,
          "tokens": 959746,
          "time": 142.1
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": false,
          "cost": 0.3445,
          "tokens": 536201,
          "time": 47.6
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.3118,
          "tokens": 450071,
          "time": 74.3
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.3958,
          "tokens": 893273,
          "time": 105.1
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": true,
          "cost": 0.4024,
          "tokens": 837449,
          "time": 98.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 0.2704,
          "tokens": 501940,
          "time": 69.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.3378,
          "tokens": 562204,
          "time": 67.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.8116,
          "tokens": 1814565,
          "time": 193.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.4251,
          "tokens": 770224,
          "time": 88.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.3106,
          "tokens": 612066,
          "time": 83.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": true,
          "cost": 0.5659,
          "tokens": 1075955,
          "time": 168.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.3185,
          "tokens": 658676,
          "time": 91.2
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.7483,
          "tokens": 1523565,
          "time": 190.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.6061,
          "tokens": 1255736,
          "time": 154.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.5946,
          "tokens": 1220564,
          "time": 171.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.8867,
          "tokens": 1734852,
          "time": 170.9
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.4541,
          "tokens": 846657,
          "time": 112.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.6606,
          "tokens": 1393988,
          "time": 161.6
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.7711,
          "tokens": 1759589,
          "time": 178.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": true,
          "cost": 0.4073,
          "tokens": 756958,
          "time": 102.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.2374,
          "tokens": 442827,
          "time": 62.0
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.5036,
          "tokens": 1186501,
          "time": 124.0
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": false,
          "cost": 0.5899,
          "tokens": 1149831,
          "time": 191.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": false,
          "cost": 0.4411,
          "tokens": 931689,
          "time": 103.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.4817,
          "tokens": 1030430,
          "time": 123.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.5974,
          "tokens": 1299377,
          "time": 161.2
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.7894,
          "tokens": 1837194,
          "time": 207.1
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.2436,
          "tokens": 449725,
          "time": 61.2
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.358,
          "tokens": 724148,
          "time": 89.3
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.7664,
          "tokens": 1724374,
          "time": 168.3
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 0.3428,
          "tokens": 661391,
          "time": 84.5
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.3182,
          "tokens": 606825,
          "time": 83.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.3547,
          "tokens": 711475,
          "time": 93.7
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.3007,
          "tokens": 626232,
          "time": 60.4
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.436,
          "tokens": 733926,
          "time": 91.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.5894,
          "tokens": 1239980,
          "time": 140.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.7254,
          "tokens": 1619378,
          "time": 196.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.5711,
          "tokens": 1182668,
          "time": 126.5
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.4443,
          "tokens": 956813,
          "time": 98.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": true,
          "cost": 0.3295,
          "tokens": 637912,
          "time": 82.3
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.2992,
          "tokens": 681155,
          "time": 72.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.1576,
          "tokens": 254612,
          "time": 37.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.3872,
          "tokens": 782054,
          "time": 89.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.2541,
          "tokens": 473040,
          "time": 58.5
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.2031,
          "tokens": 439524,
          "time": 55.7
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.5119,
          "tokens": 1038328,
          "time": 86.6
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.2956,
          "tokens": 455086,
          "time": 63.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.4624,
          "tokens": 986839,
          "time": 101.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.2457,
          "tokens": 427662,
          "time": 51.7
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.1518,
          "tokens": 315160,
          "time": 41.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.5904,
          "tokens": 1301222,
          "time": 121.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.3651,
          "tokens": 741549,
          "time": 88.3
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": true,
          "cost": 0.4506,
          "tokens": 980144,
          "time": 111.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.5536,
          "tokens": 1188789,
          "time": 124.8
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": true,
          "cost": 0.3611,
          "tokens": 674559,
          "time": 85.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.4588,
          "tokens": 904600,
          "time": 128.2
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.7196,
          "tokens": 1390008,
          "time": 138.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.7011,
          "tokens": 1579485,
          "time": 184.5
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": true,
          "cost": 0.5755,
          "tokens": 1067112,
          "time": 152.5
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": true,
          "cost": 0.4522,
          "tokens": 870900,
          "time": 98.7
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": true,
          "cost": 0.4496,
          "tokens": 899736,
          "time": 110.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.5322,
          "tokens": 1156924,
          "time": 140.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.6077,
          "tokens": 1281460,
          "time": 166.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.5008,
          "tokens": 975939,
          "time": 1820.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.658,
          "tokens": 1356334,
          "time": 145.1
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.5576,
          "tokens": 1152872,
          "time": 135.9
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.5244,
          "tokens": 1088688,
          "time": 142.9
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.4347,
          "tokens": 860673,
          "time": 100.8
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.6665,
          "tokens": 1384458,
          "time": 180.4
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.3285,
          "tokens": 604387,
          "time": 84.1
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.7341,
          "tokens": 1583552,
          "time": 197.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.4232,
          "tokens": 874424,
          "time": 97.2
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.245,
          "tokens": 493425,
          "time": 67.9
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.4684,
          "tokens": 843541,
          "time": 68.2
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.5132,
          "tokens": 927937,
          "time": 113.0
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": false,
          "cost": 0.2816,
          "tokens": 556405,
          "time": 67.7
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 0.3114,
          "tokens": 651013,
          "time": 74.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 0.6155,
          "tokens": 1335516,
          "time": 153.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.5604,
          "tokens": 1215787,
          "time": 113.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.5364,
          "tokens": 1119333,
          "time": 122.4
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.4341,
          "tokens": 953619,
          "time": 88.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": true,
          "cost": 0.4725,
          "tokens": 862483,
          "time": 132.1
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": true,
          "cost": 0.362,
          "tokens": 783902,
          "time": 94.9
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.4886,
          "tokens": 953637,
          "time": 101.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.375,
          "tokens": 778590,
          "time": 83.5
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.3243,
          "tokens": 675329,
          "time": 74.7
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.5846,
          "tokens": 1292704,
          "time": 114.6
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.6295,
          "tokens": 1296405,
          "time": 159.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.4348,
          "tokens": 871357,
          "time": 130.1
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.5906,
          "tokens": 1298715,
          "time": 155.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.4248,
          "tokens": 810145,
          "time": 130.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.3026,
          "tokens": 643279,
          "time": 84.7
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.3703,
          "tokens": 757495,
          "time": 97.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": true,
          "cost": 0.3,
          "tokens": 605447,
          "time": 73.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.4846,
          "tokens": 1041143,
          "time": 110.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.4713,
          "tokens": 960172,
          "time": 151.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.2734,
          "tokens": 520253,
          "time": 84.1
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": true,
          "cost": 0.4354,
          "tokens": 749855,
          "time": 69.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.5837,
          "tokens": 1234066,
          "time": 134.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.2493,
          "tokens": 333426,
          "time": 55.6
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.6477,
          "tokens": 1459810,
          "time": 149.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.5627,
          "tokens": 1130171,
          "time": 139.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.1918,
          "tokens": 363996,
          "time": 60.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.1958,
          "tokens": 373896,
          "time": 55.3
        }
      ]
    },
    {
      "runKey": "hermes-sonnet-4.5",
      "harness": "hermes",
      "model": "claude-sonnet-4.5",
      "modelName": "claude-sonnet-4.5",
      "reported": {
        "cost": 0.629,
        "tokens": 198000,
        "time": 130,
        "tokensEstimated": true
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.4608,
          "tokens": null,
          "time": 124.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.8403,
          "tokens": null,
          "time": 152.1
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.511,
          "tokens": null,
          "time": 105.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.4434,
          "tokens": null,
          "time": 117.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.3817,
          "tokens": null,
          "time": 117.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.2869,
          "tokens": null,
          "time": 78.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": true,
          "cost": 0.2171,
          "tokens": null,
          "time": 80.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 1.1057,
          "tokens": null,
          "time": 138.5
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.8358,
          "tokens": null,
          "time": 193.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 0.5455,
          "tokens": null,
          "time": 130.3
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.3241,
          "tokens": null,
          "time": 106.4
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.6617,
          "tokens": null,
          "time": 146.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.2135,
          "tokens": null,
          "time": 99.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.4692,
          "tokens": null,
          "time": 139.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.6899,
          "tokens": null,
          "time": 118.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.2434,
          "tokens": null,
          "time": 84.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.4427,
          "tokens": null,
          "time": 114.8
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.3702,
          "tokens": null,
          "time": 90.8
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.3206,
          "tokens": null,
          "time": 111.7
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.3973,
          "tokens": null,
          "time": 98.1
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.5207,
          "tokens": null,
          "time": 137.7
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": true,
          "cost": 0.5657,
          "tokens": null,
          "time": 125.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.2526,
          "tokens": null,
          "time": 98.3
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.8226,
          "tokens": null,
          "time": 172.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.3484,
          "tokens": null,
          "time": 134.9
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.3638,
          "tokens": null,
          "time": 100.3
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.5447,
          "tokens": null,
          "time": 88.0
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.2392,
          "tokens": null,
          "time": 101.2
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.35,
          "tokens": null,
          "time": 110.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.5004,
          "tokens": null,
          "time": 133.7
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": true,
          "cost": 0.2984,
          "tokens": null,
          "time": 86.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 1.1729,
          "tokens": null,
          "time": 140.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.8513,
          "tokens": null,
          "time": 150.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 1.1638,
          "tokens": null,
          "time": 138.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.8512,
          "tokens": null,
          "time": 154.6
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.7984,
          "tokens": null,
          "time": 140.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 1.1833,
          "tokens": null,
          "time": 111.3
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.4867,
          "tokens": null,
          "time": 152.1
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": true,
          "cost": 0.4538,
          "tokens": null,
          "time": 156.0
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.5901,
          "tokens": null,
          "time": 129.2
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.236,
          "tokens": null,
          "time": 75.2
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.6284,
          "tokens": null,
          "time": 140.9
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.4115,
          "tokens": null,
          "time": 153.0
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.5947,
          "tokens": null,
          "time": 121.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.3628,
          "tokens": null,
          "time": 97.0
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.8994,
          "tokens": null,
          "time": 161.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.6709,
          "tokens": null,
          "time": 102.3
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.6801,
          "tokens": null,
          "time": 139.2
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.7531,
          "tokens": null,
          "time": 140.2
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.754,
          "tokens": null,
          "time": 120.8
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.4713,
          "tokens": null,
          "time": 112.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.8784,
          "tokens": null,
          "time": 147.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 1.0679,
          "tokens": null,
          "time": 153.2
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.6667,
          "tokens": null,
          "time": 167.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.5166,
          "tokens": null,
          "time": 140.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.9137,
          "tokens": null,
          "time": 179.2
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.3974,
          "tokens": null,
          "time": 104.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": true,
          "cost": 0.606,
          "tokens": null,
          "time": 174.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.3996,
          "tokens": null,
          "time": 111.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.435,
          "tokens": null,
          "time": 114.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.3056,
          "tokens": null,
          "time": 102.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.4321,
          "tokens": null,
          "time": 111.0
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": true,
          "cost": 0.7265,
          "tokens": null,
          "time": 114.3
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.9501,
          "tokens": null,
          "time": 132.5
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 1.009,
          "tokens": null,
          "time": 142.9
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": false,
          "cost": 0.7087,
          "tokens": null,
          "time": 98.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.9773,
          "tokens": null,
          "time": 132.2
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": true,
          "cost": 1.0719,
          "tokens": null,
          "time": 111.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.8225,
          "tokens": null,
          "time": 110.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.3527,
          "tokens": null,
          "time": 77.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": true,
          "cost": 0.5551,
          "tokens": null,
          "time": 133.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.6552,
          "tokens": null,
          "time": 170.5
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.2825,
          "tokens": null,
          "time": 105.3
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": true,
          "cost": 0.446,
          "tokens": null,
          "time": 125.6
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.3523,
          "tokens": null,
          "time": 113.6
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.4916,
          "tokens": null,
          "time": 110.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": true,
          "cost": 0.3835,
          "tokens": null,
          "time": 128.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": true,
          "cost": 0.3432,
          "tokens": null,
          "time": 124.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.4207,
          "tokens": null,
          "time": 101.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.5585,
          "tokens": null,
          "time": 134.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": false,
          "cost": 0.5324,
          "tokens": null,
          "time": 84.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.4915,
          "tokens": null,
          "time": 113.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": true,
          "cost": 1.9102,
          "tokens": null,
          "time": 148.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.564,
          "tokens": null,
          "time": 159.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.9612,
          "tokens": null,
          "time": 132.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.7258,
          "tokens": null,
          "time": 117.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.3444,
          "tokens": null,
          "time": 81.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 1.1779,
          "tokens": null,
          "time": 169.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": false,
          "cost": 0.5318,
          "tokens": null,
          "time": 107.3
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 0.3279,
          "tokens": null,
          "time": 111.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.4118,
          "tokens": null,
          "time": 108.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.632,
          "tokens": null,
          "time": 131.5
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": false,
          "cost": 0.6915,
          "tokens": null,
          "time": 121.1
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": false,
          "cost": 0.8184,
          "tokens": null,
          "time": 168.1
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": false,
          "cost": 1.028,
          "tokens": null,
          "time": 157.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.5283,
          "tokens": null,
          "time": 156.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": false,
          "cost": 1.2871,
          "tokens": null,
          "time": 230.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.2393,
          "tokens": null,
          "time": 84.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.5255,
          "tokens": null,
          "time": 120.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.8582,
          "tokens": null,
          "time": 157.9
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 0.8746,
          "tokens": null,
          "time": 127.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.6798,
          "tokens": null,
          "time": 147.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 0.4678,
          "tokens": null,
          "time": 120.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": true,
          "cost": 0.4365,
          "tokens": null,
          "time": 99.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": true,
          "cost": 0.3442,
          "tokens": null,
          "time": 110.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.6495,
          "tokens": null,
          "time": 120.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.9139,
          "tokens": null,
          "time": 125.0
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 1.427,
          "tokens": null,
          "time": 174.8
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 1.1537,
          "tokens": null,
          "time": 153.3
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.3627,
          "tokens": null,
          "time": 98.1
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.2818,
          "tokens": null,
          "time": 87.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.2801,
          "tokens": null,
          "time": 85.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 1.0537,
          "tokens": null,
          "time": 155.7
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.6945,
          "tokens": null,
          "time": 139.3
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.4864,
          "tokens": null,
          "time": 122.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": true,
          "cost": 0.3093,
          "tokens": null,
          "time": 110.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": true,
          "cost": 0.295,
          "tokens": null,
          "time": 84.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": true,
          "cost": 0.1915,
          "tokens": null,
          "time": 77.1
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.9127,
          "tokens": null,
          "time": 141.5
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.6368,
          "tokens": null,
          "time": 117.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.7041,
          "tokens": null,
          "time": 154.8
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": true,
          "cost": 0.7591,
          "tokens": null,
          "time": 163.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.9944,
          "tokens": null,
          "time": 200.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.9756,
          "tokens": null,
          "time": 184.6
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 1.1586,
          "tokens": null,
          "time": 117.3
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.4712,
          "tokens": null,
          "time": 121.8
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 1.6726,
          "tokens": null,
          "time": 186.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": true,
          "cost": 2.1684,
          "tokens": null,
          "time": 174.3
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": true,
          "cost": 0.3919,
          "tokens": null,
          "time": 111.7
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.3389,
          "tokens": null,
          "time": 101.4
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.5603,
          "tokens": null,
          "time": 119.7
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.8287,
          "tokens": null,
          "time": 140.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.5572,
          "tokens": null,
          "time": 129.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.2731,
          "tokens": null,
          "time": 79.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.2563,
          "tokens": null,
          "time": 83.1
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.2852,
          "tokens": null,
          "time": 95.6
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.9944,
          "tokens": null,
          "time": 162.7
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.4587,
          "tokens": null,
          "time": 115.4
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.5895,
          "tokens": null,
          "time": 130.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.8037,
          "tokens": null,
          "time": 122.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": true,
          "cost": 0.5245,
          "tokens": null,
          "time": 140.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.4565,
          "tokens": null,
          "time": 119.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.9232,
          "tokens": null,
          "time": 217.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 1.0362,
          "tokens": null,
          "time": 192.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.2827,
          "tokens": null,
          "time": 119.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.8464,
          "tokens": null,
          "time": 159.3
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.1788,
          "tokens": null,
          "time": 94.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": true,
          "cost": 0.3543,
          "tokens": null,
          "time": 97.9
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.7339,
          "tokens": null,
          "time": 155.2
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.4209,
          "tokens": null,
          "time": 153.3
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.3802,
          "tokens": null,
          "time": 121.9
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.9421,
          "tokens": null,
          "time": 136.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.5961,
          "tokens": null,
          "time": 163.4
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.9933,
          "tokens": null,
          "time": 152.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 1.2911,
          "tokens": null,
          "time": 187.5
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.5874,
          "tokens": null,
          "time": 126.2
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.5788,
          "tokens": null,
          "time": 124.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.2344,
          "tokens": null,
          "time": 93.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.5496,
          "tokens": null,
          "time": 144.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 1.2585,
          "tokens": null,
          "time": 215.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.4964,
          "tokens": null,
          "time": 170.7
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.5461,
          "tokens": null,
          "time": 131.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.5852,
          "tokens": null,
          "time": 174.1
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": false,
          "cost": 0.7875,
          "tokens": null,
          "time": 141.2
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.7693,
          "tokens": null,
          "time": 175.9
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.6292,
          "tokens": null,
          "time": 129.0
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": false,
          "cost": 0.5784,
          "tokens": null,
          "time": 98.5
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.5824,
          "tokens": null,
          "time": 105.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.3833,
          "tokens": null,
          "time": 134.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": false,
          "cost": 0.1383,
          "tokens": null,
          "time": 89.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.5582,
          "tokens": null,
          "time": 167.1
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.4699,
          "tokens": null,
          "time": 121.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.5636,
          "tokens": null,
          "time": 143.9
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.282,
          "tokens": null,
          "time": 117.2
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.408,
          "tokens": null,
          "time": 141.1
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.3652,
          "tokens": null,
          "time": 100.8
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 0.8093,
          "tokens": null,
          "time": 179.8
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.5109,
          "tokens": null,
          "time": 122.0
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.752,
          "tokens": null,
          "time": 150.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.4913,
          "tokens": null,
          "time": 140.2
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 1.3407,
          "tokens": null,
          "time": 157.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.9285,
          "tokens": null,
          "time": 207.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.6289,
          "tokens": null,
          "time": 128.0
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.4607,
          "tokens": null,
          "time": 143.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.7051,
          "tokens": null,
          "time": 128.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.4384,
          "tokens": null,
          "time": 93.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.3492,
          "tokens": null,
          "time": 101.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": true,
          "cost": 0.9011,
          "tokens": null,
          "time": 166.0
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.6585,
          "tokens": null,
          "time": 122.3
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.5382,
          "tokens": null,
          "time": 114.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.8642,
          "tokens": null,
          "time": 200.1
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": true,
          "cost": 0.5727,
          "tokens": null,
          "time": 148.9
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.2779,
          "tokens": null,
          "time": 106.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.2036,
          "tokens": null,
          "time": 106.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 1.3182,
          "tokens": null,
          "time": 172.5
        }
      ]
    },
    {
      "runKey": "rlm-gpt-5-mini",
      "harness": "trace-rlm",
      "model": "gpt-5-mini",
      "modelName": "gpt-5-mini",
      "reported": {
        "cost": 0.076,
        "tokens": 340000,
        "time": 203,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.0128,
          "tokens": 42076,
          "time": 91.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.0582,
          "tokens": 190964,
          "time": 142.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.0239,
          "tokens": 88360,
          "time": 136.6
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.0201,
          "tokens": 73352,
          "time": 80.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.0558,
          "tokens": 213154,
          "time": 156.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.0081,
          "tokens": 30692,
          "time": 86.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.0444,
          "tokens": 167283,
          "time": 209.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.0217,
          "tokens": 80748,
          "time": 104.7
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.07,
          "tokens": 282108,
          "time": 232.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 0.036,
          "tokens": 142522,
          "time": 155.7
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.0191,
          "tokens": 67295,
          "time": 102.5
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": true,
          "cost": 0.0711,
          "tokens": 275710,
          "time": 264.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.0289,
          "tokens": 94895,
          "time": 201.9
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.0165,
          "tokens": 61181,
          "time": 103.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.0236,
          "tokens": 82378,
          "time": 105.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.0347,
          "tokens": 139160,
          "time": 156.2
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.0425,
          "tokens": 173829,
          "time": 178.7
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.0232,
          "tokens": 66747,
          "time": 114.3
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.0293,
          "tokens": 61263,
          "time": 191.8
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.0126,
          "tokens": 26084,
          "time": 104.0
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.0242,
          "tokens": 79941,
          "time": 125.6
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.0258,
          "tokens": 87900,
          "time": 89.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.0285,
          "tokens": 108128,
          "time": 196.3
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.0449,
          "tokens": 180623,
          "time": 133.8
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.0889,
          "tokens": 375959,
          "time": 219.9
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.0356,
          "tokens": 124571,
          "time": 119.9
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.0495,
          "tokens": 173971,
          "time": 174.2
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.0198,
          "tokens": 64456,
          "time": 116.3
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.0682,
          "tokens": 327162,
          "time": 219.6
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.0251,
          "tokens": 85559,
          "time": 134.1
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.0337,
          "tokens": 101062,
          "time": 179.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.0987,
          "tokens": 423482,
          "time": 203.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.026,
          "tokens": 116641,
          "time": 168.9
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.1643,
          "tokens": 1763130,
          "time": 540.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.0206,
          "tokens": 67603,
          "time": 109.2
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": true,
          "cost": 0.0794,
          "tokens": 456266,
          "time": 247.5
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.035,
          "tokens": 133603,
          "time": 179.0
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.0931,
          "tokens": 486142,
          "time": 298.6
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.0215,
          "tokens": 67182,
          "time": 128.4
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.02,
          "tokens": 67701,
          "time": 135.7
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.0152,
          "tokens": 47428,
          "time": 90.2
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.0298,
          "tokens": 111515,
          "time": 198.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.0372,
          "tokens": 131438,
          "time": 156.1
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": true,
          "cost": 0.0179,
          "tokens": 53148,
          "time": 118.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.0095,
          "tokens": 58388,
          "time": 414.7
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.048,
          "tokens": 228479,
          "time": 267.8
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": true,
          "cost": 0.0176,
          "tokens": 61387,
          "time": 106.4
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.0818,
          "tokens": 359425,
          "time": 255.4
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": true,
          "cost": 0.0322,
          "tokens": 131307,
          "time": 144.9
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.0327,
          "tokens": 111917,
          "time": 143.5
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.0128,
          "tokens": 45852,
          "time": 87.0
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.0642,
          "tokens": 237037,
          "time": 193.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": true,
          "cost": 0.0529,
          "tokens": 229100,
          "time": 195.7
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.1394,
          "tokens": 518003,
          "time": 418.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.1029,
          "tokens": 550648,
          "time": 364.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.0341,
          "tokens": 118936,
          "time": 146.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.0524,
          "tokens": 173414,
          "time": 185.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.0296,
          "tokens": 91138,
          "time": 137.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.0893,
          "tokens": 385762,
          "time": 268.4
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.0128,
          "tokens": 43651,
          "time": 114.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.0517,
          "tokens": 192534,
          "time": 190.3
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": true,
          "cost": 0.0278,
          "tokens": 97620,
          "time": 142.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.1271,
          "tokens": 519326,
          "time": 326.2
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.052,
          "tokens": 192083,
          "time": 199.9
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.019,
          "tokens": 61044,
          "time": 128.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": false,
          "cost": 0.1235,
          "tokens": 738426,
          "time": 438.6
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.0595,
          "tokens": 194774,
          "time": 206.4
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.1153,
          "tokens": 680786,
          "time": 371.1
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": true,
          "cost": 0.0998,
          "tokens": 621210,
          "time": 316.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.0239,
          "tokens": 84344,
          "time": 116.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.1035,
          "tokens": 147681,
          "time": 555.6
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": true,
          "cost": 0.0412,
          "tokens": 146960,
          "time": 215.4
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.0166,
          "tokens": 51774,
          "time": 115.4
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.0343,
          "tokens": 117747,
          "time": 173.0
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.0212,
          "tokens": 77497,
          "time": 136.7
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.0375,
          "tokens": 150608,
          "time": 248.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.0859,
          "tokens": 394534,
          "time": 239.6
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.0368,
          "tokens": 150711,
          "time": 183.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.0275,
          "tokens": 110492,
          "time": 134.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.0254,
          "tokens": 78239,
          "time": 141.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.0362,
          "tokens": 147885,
          "time": 138.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": true,
          "cost": 0.0741,
          "tokens": 296850,
          "time": 207.3
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": false,
          "cost": 0.0413,
          "tokens": 170873,
          "time": 177.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.0717,
          "tokens": 255468,
          "time": 173.4
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.0775,
          "tokens": 295940,
          "time": 324.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": true,
          "cost": 0.0497,
          "tokens": 169320,
          "time": 132.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.0723,
          "tokens": 289452,
          "time": 216.2
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.5058,
          "tokens": 1849782,
          "time": 489.4
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": false,
          "cost": 0.0474,
          "tokens": 185942,
          "time": 157.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 0.0499,
          "tokens": 284868,
          "time": 319.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.0177,
          "tokens": 55072,
          "time": 117.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.0589,
          "tokens": 203238,
          "time": 199.4
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.1212,
          "tokens": 344864,
          "time": 541.5
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": true,
          "cost": 0.0316,
          "tokens": 115206,
          "time": 210.6
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.0304,
          "tokens": 107003,
          "time": 145.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.0471,
          "tokens": 197391,
          "time": 129.5
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.063,
          "tokens": 252167,
          "time": 190.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": true,
          "cost": 0.0681,
          "tokens": 261670,
          "time": 238.7
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.0308,
          "tokens": 105571,
          "time": 163.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.1158,
          "tokens": 572623,
          "time": 370.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 0.0941,
          "tokens": 354337,
          "time": 217.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.0238,
          "tokens": 69506,
          "time": 162.3
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 0.0746,
          "tokens": 298981,
          "time": 204.7
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.0301,
          "tokens": 155193,
          "time": 496.1
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": true,
          "cost": 0.0529,
          "tokens": 199226,
          "time": 177.4
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.1069,
          "tokens": 575764,
          "time": 276.7
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.1179,
          "tokens": 678856,
          "time": 285.5
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": true,
          "cost": 0.0119,
          "tokens": 52113,
          "time": 91.1
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.1404,
          "tokens": 630732,
          "time": 279.8
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.0201,
          "tokens": 55250,
          "time": 131.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.0919,
          "tokens": 400780,
          "time": 243.7
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.0465,
          "tokens": 175807,
          "time": 125.3
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.025,
          "tokens": 84275,
          "time": 123.4
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.046,
          "tokens": 196116,
          "time": 145.9
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": false,
          "cost": 0.0209,
          "tokens": 72430,
          "time": 108.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.0277,
          "tokens": 102101,
          "time": 188.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 1.7542,
          "tokens": 6961514,
          "time": 847.7
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.1184,
          "tokens": 645136,
          "time": 311.7
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": true,
          "cost": 0.0345,
          "tokens": 125505,
          "time": 130.0
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.0588,
          "tokens": 217727,
          "time": 175.4
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.0117,
          "tokens": 35677,
          "time": 75.2
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 0.0226,
          "tokens": 68607,
          "time": 120.7
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.1348,
          "tokens": 724692,
          "time": 299.4
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.0986,
          "tokens": 533990,
          "time": 259.5
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.0841,
          "tokens": 300930,
          "time": 139.1
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.0183,
          "tokens": 52464,
          "time": 107.8
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.0116,
          "tokens": 45018,
          "time": 125.3
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.0988,
          "tokens": 429703,
          "time": 225.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0135,
          "tokens": 47867,
          "time": 77.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.0203,
          "tokens": 61542,
          "time": 163.4
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.0479,
          "tokens": 184067,
          "time": 182.2
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.1311,
          "tokens": 580947,
          "time": 244.4
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.1037,
          "tokens": 478110,
          "time": 276.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.3013,
          "tokens": 1194863,
          "time": 318.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.0277,
          "tokens": 92465,
          "time": 109.6
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.0421,
          "tokens": 163872,
          "time": 169.0
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.0436,
          "tokens": 163682,
          "time": 222.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.0156,
          "tokens": 57968,
          "time": 91.2
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.0562,
          "tokens": 197235,
          "time": 209.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 0.0254,
          "tokens": 82461,
          "time": 111.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.0877,
          "tokens": 410504,
          "time": 195.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": false,
          "cost": 0.0243,
          "tokens": 77030,
          "time": 141.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.048,
          "tokens": 169309,
          "time": 144.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.0395,
          "tokens": 152749,
          "time": 111.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.0241,
          "tokens": 85008,
          "time": 185.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.0411,
          "tokens": 142367,
          "time": 146.5
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": true,
          "cost": 0.0491,
          "tokens": 168092,
          "time": 216.7
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.0395,
          "tokens": 138931,
          "time": 146.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.5932,
          "tokens": 2251464,
          "time": 809.3
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.0312,
          "tokens": 95093,
          "time": 160.4
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.0357,
          "tokens": 134713,
          "time": 192.1
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.0456,
          "tokens": 162446,
          "time": 187.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.0525,
          "tokens": 178715,
          "time": 246.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.0142,
          "tokens": 42004,
          "time": 106.9
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.0707,
          "tokens": 241063,
          "time": 175.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": true,
          "cost": 0.0193,
          "tokens": 60607,
          "time": 119.3
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.053,
          "tokens": 185524,
          "time": 126.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.0598,
          "tokens": 219648,
          "time": 164.4
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.0739,
          "tokens": 317282,
          "time": 292.8
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.0263,
          "tokens": 88919,
          "time": 117.0
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.0523,
          "tokens": 174765,
          "time": 219.8
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.0361,
          "tokens": 115158,
          "time": 157.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.1263,
          "tokens": 1108805,
          "time": 570.0
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.0454,
          "tokens": 172899,
          "time": 148.4
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": true,
          "cost": 0.0157,
          "tokens": 46562,
          "time": 92.1
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": true,
          "cost": 0.0456,
          "tokens": 190960,
          "time": 143.3
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.0559,
          "tokens": 174616,
          "time": 200.1
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.023,
          "tokens": 70921,
          "time": 119.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": true,
          "cost": 0.0693,
          "tokens": 282182,
          "time": 175.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.0381,
          "tokens": 142678,
          "time": 121.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.05,
          "tokens": 235854,
          "time": 151.2
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.0234,
          "tokens": 78855,
          "time": 145.8
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.0205,
          "tokens": 56649,
          "time": 144.6
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.0218,
          "tokens": 79648,
          "time": 120.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.6017,
          "tokens": 2149386,
          "time": 837.0
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": true,
          "cost": 0.0956,
          "tokens": 454358,
          "time": 262.3
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": false,
          "cost": 0.0426,
          "tokens": 146305,
          "time": 129.3
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.0656,
          "tokens": 286131,
          "time": 215.7
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.0748,
          "tokens": 298701,
          "time": 203.4
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.0597,
          "tokens": 233856,
          "time": 190.6
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.3456,
          "tokens": 1340412,
          "time": 346.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.0291,
          "tokens": 101208,
          "time": 183.3
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": true,
          "cost": 0.0238,
          "tokens": 77222,
          "time": 110.1
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.0193,
          "tokens": 69462,
          "time": 84.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.0163,
          "tokens": 48526,
          "time": 114.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.0109,
          "tokens": 32559,
          "time": 82.8
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.0151,
          "tokens": 50994,
          "time": 103.2
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.0132,
          "tokens": 38172,
          "time": 107.1
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.0269,
          "tokens": 87360,
          "time": 108.7
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.0951,
          "tokens": 437578,
          "time": 265.7
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.0576,
          "tokens": 246106,
          "time": 162.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.0899,
          "tokens": 337092,
          "time": 228.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 1.4817,
          "tokens": 11534620,
          "time": 1048.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.0449,
          "tokens": 165455,
          "time": 183.1
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.0222,
          "tokens": 83022,
          "time": 77.7
        }
      ]
    },
    {
      "runKey": "rag-gpt-5-mini",
      "harness": "trace-rag",
      "model": "gpt-5-mini",
      "modelName": "gpt-5-mini",
      "reported": {
        "cost": 0.023,
        "tokens": 83000,
        "time": 152,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.0155,
          "tokens": 44666,
          "time": 101.9
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.0276,
          "tokens": 84853,
          "time": 140.7
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.0185,
          "tokens": 49467,
          "time": 137.5
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.0138,
          "tokens": 45777,
          "time": 67.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.0316,
          "tokens": 108647,
          "time": 127.4
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": false,
          "cost": 0.0103,
          "tokens": 33753,
          "time": 102.8
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.0424,
          "tokens": 139498,
          "time": 124.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": true,
          "cost": 0.0155,
          "tokens": 44241,
          "time": 106.6
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": true,
          "cost": 0.0357,
          "tokens": 118880,
          "time": 174.8
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 0.0177,
          "tokens": 50098,
          "time": 101.0
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.017,
          "tokens": 52676,
          "time": 86.9
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.0355,
          "tokens": 123579,
          "time": 128.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.0329,
          "tokens": 98728,
          "time": 137.4
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.0154,
          "tokens": 49351,
          "time": 56.6
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.0304,
          "tokens": 94085,
          "time": 139.8
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.0268,
          "tokens": 83920,
          "time": 179.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.0266,
          "tokens": 89786,
          "time": 213.0
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": true,
          "cost": 0.0214,
          "tokens": 64582,
          "time": 305.3
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.0161,
          "tokens": 55903,
          "time": 162.2
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.0123,
          "tokens": 35444,
          "time": 270.1
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.0392,
          "tokens": 138748,
          "time": 305.9
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.0213,
          "tokens": 67078,
          "time": 270.2
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.017,
          "tokens": 49110,
          "time": 327.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.0153,
          "tokens": 45912,
          "time": 163.7
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": false,
          "cost": 0.018,
          "tokens": 48985,
          "time": 176.2
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.0294,
          "tokens": 97488,
          "time": 240.6
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": true,
          "cost": 0.0162,
          "tokens": 43705,
          "time": 64.2
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.0174,
          "tokens": 56869,
          "time": 212.0
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.0261,
          "tokens": 78095,
          "time": 239.4
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.0146,
          "tokens": 44429,
          "time": 199.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.0345,
          "tokens": 107513,
          "time": 236.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.02,
          "tokens": 66083,
          "time": 178.0
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.0424,
          "tokens": 149306,
          "time": 289.7
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.0302,
          "tokens": 99244,
          "time": 174.5
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 0.0136,
          "tokens": 35723,
          "time": 306.0
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.012,
          "tokens": 34772,
          "time": 194.5
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.0279,
          "tokens": 101971,
          "time": 128.1
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.0199,
          "tokens": 65620,
          "time": 226.4
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.0199,
          "tokens": 52574,
          "time": 139.5
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.0211,
          "tokens": 64111,
          "time": 219.5
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.0128,
          "tokens": 34750,
          "time": 212.8
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.0126,
          "tokens": 35972,
          "time": 293.6
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.0194,
          "tokens": 49295,
          "time": 196.1
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.0217,
          "tokens": 68896,
          "time": 304.5
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.012,
          "tokens": 33230,
          "time": 122.7
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.0368,
          "tokens": 132057,
          "time": 91.5
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 0.0178,
          "tokens": 56408,
          "time": 93.0
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": false,
          "cost": 0.027,
          "tokens": 88769,
          "time": 110.0
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.0495,
          "tokens": 181116,
          "time": 91.5
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.0149,
          "tokens": 47104,
          "time": 112.0
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.0125,
          "tokens": 34647,
          "time": 112.6
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.0409,
          "tokens": 137786,
          "time": 123.3
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.0126,
          "tokens": 35643,
          "time": 96.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.0551,
          "tokens": 183832,
          "time": 140.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.0117,
          "tokens": 35799,
          "time": 71.9
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.0156,
          "tokens": 50159,
          "time": 85.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.0147,
          "tokens": 52740,
          "time": 92.1
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.0158,
          "tokens": 46036,
          "time": 95.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": true,
          "cost": 0.0375,
          "tokens": 127102,
          "time": 105.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.0108,
          "tokens": 33371,
          "time": 73.3
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.0112,
          "tokens": 34189,
          "time": 70.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": false,
          "cost": 0.0246,
          "tokens": 80776,
          "time": 314.1
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.0557,
          "tokens": 181555,
          "time": 396.6
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.0186,
          "tokens": 56185,
          "time": 228.1
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.0205,
          "tokens": 68730,
          "time": 304.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.0147,
          "tokens": 44178,
          "time": 324.4
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.0261,
          "tokens": 87343,
          "time": 305.4
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 0.0867,
          "tokens": 303797,
          "time": 294.4
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 0.163,
          "tokens": 622569,
          "time": 345.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": false,
          "cost": 0.0172,
          "tokens": 55774,
          "time": 285.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.0203,
          "tokens": 67007,
          "time": 300.5
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.0383,
          "tokens": 120428,
          "time": 354.6
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.0183,
          "tokens": 54087,
          "time": 226.8
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.0123,
          "tokens": 34238,
          "time": 259.1
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.0291,
          "tokens": 80053,
          "time": 285.4
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": true,
          "cost": 0.0136,
          "tokens": 33512,
          "time": 302.1
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.0153,
          "tokens": 45491,
          "time": 220.3
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.0186,
          "tokens": 55352,
          "time": 163.4
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.0204,
          "tokens": 65464,
          "time": 239.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.0403,
          "tokens": 139051,
          "time": 360.9
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.0318,
          "tokens": 98130,
          "time": 335.5
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.0125,
          "tokens": 34437,
          "time": 176.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": false,
          "cost": 0.0158,
          "tokens": 37407,
          "time": 280.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": true,
          "cost": 0.0135,
          "tokens": 37239,
          "time": 102.7
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": true,
          "cost": 0.0162,
          "tokens": 51679,
          "time": 88.9
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.0108,
          "tokens": 31397,
          "time": 89.1
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": true,
          "cost": 0.0323,
          "tokens": 102660,
          "time": 125.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.0163,
          "tokens": 53343,
          "time": 83.9
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": false,
          "cost": 0.011,
          "tokens": 34863,
          "time": 88.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": false,
          "cost": 0.0306,
          "tokens": 107747,
          "time": 87.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.022,
          "tokens": 71671,
          "time": 129.7
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.018,
          "tokens": 54766,
          "time": 168.3
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.0124,
          "tokens": 36388,
          "time": 129.3
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": false,
          "cost": 0.0231,
          "tokens": 67390,
          "time": 191.8
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.0459,
          "tokens": 157788,
          "time": 195.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.0292,
          "tokens": 98442,
          "time": 192.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.0486,
          "tokens": 168002,
          "time": 205.3
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.0215,
          "tokens": 63557,
          "time": 201.9
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.0128,
          "tokens": 36496,
          "time": 148.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": true,
          "cost": 0.0417,
          "tokens": 137209,
          "time": 225.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": true,
          "cost": 0.0206,
          "tokens": 67560,
          "time": 207.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 0.0377,
          "tokens": 121470,
          "time": 293.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": true,
          "cost": 0.0167,
          "tokens": 54835,
          "time": 237.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.012,
          "tokens": 36213,
          "time": 227.3
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.0248,
          "tokens": 80210,
          "time": 250.9
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.0126,
          "tokens": 35796,
          "time": 236.3
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 0.0952,
          "tokens": 354008,
          "time": 281.4
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.0271,
          "tokens": 89037,
          "time": 262.5
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": false,
          "cost": 0.0119,
          "tokens": 35173,
          "time": 216.7
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.0195,
          "tokens": 66922,
          "time": 187.4
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.0246,
          "tokens": 76928,
          "time": 195.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.0093,
          "tokens": 22260,
          "time": 134.9
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.0222,
          "tokens": 57942,
          "time": 194.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": true,
          "cost": 0.0308,
          "tokens": 97767,
          "time": 191.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.0422,
          "tokens": 145660,
          "time": 170.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.0244,
          "tokens": 71740,
          "time": 179.9
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.0558,
          "tokens": 198274,
          "time": 180.8
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.0372,
          "tokens": 132266,
          "time": 179.9
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 0.0406,
          "tokens": 140518,
          "time": 162.5
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": true,
          "cost": 0.0285,
          "tokens": 95502,
          "time": 160.7
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.021,
          "tokens": 61568,
          "time": 166.3
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 0.0168,
          "tokens": 47997,
          "time": 154.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.0635,
          "tokens": 214068,
          "time": 191.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": false,
          "cost": 0.0838,
          "tokens": 304001,
          "time": 164.2
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.0264,
          "tokens": 81756,
          "time": 146.6
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.025,
          "tokens": 85523,
          "time": 131.4
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.0421,
          "tokens": 142082,
          "time": 145.8
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.04,
          "tokens": 133843,
          "time": 171.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.0183,
          "tokens": 60701,
          "time": 115.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.0155,
          "tokens": 46352,
          "time": 161.6
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.0182,
          "tokens": 60107,
          "time": 143.8
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.0221,
          "tokens": 77001,
          "time": 115.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": false,
          "cost": 0.0302,
          "tokens": 106025,
          "time": 123.3
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": false,
          "cost": 0.0374,
          "tokens": 133987,
          "time": 131.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.0166,
          "tokens": 57656,
          "time": 109.9
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.0401,
          "tokens": 141794,
          "time": 121.9
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.0261,
          "tokens": 91125,
          "time": 117.4
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.013,
          "tokens": 37463,
          "time": 111.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": false,
          "cost": 0.0262,
          "tokens": 86641,
          "time": 108.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": false,
          "cost": 0.0178,
          "tokens": 57680,
          "time": 118.3
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.0148,
          "tokens": 46779,
          "time": 93.8
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": false,
          "cost": 0.0224,
          "tokens": 71570,
          "time": 88.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.016,
          "tokens": 52932,
          "time": 64.1
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.0196,
          "tokens": 60145,
          "time": 85.9
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.0242,
          "tokens": 79512,
          "time": 79.5
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.0365,
          "tokens": 115832,
          "time": 114.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.025,
          "tokens": 82067,
          "time": 97.6
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.0407,
          "tokens": 127108,
          "time": 129.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.0514,
          "tokens": 176484,
          "time": 115.8
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.0224,
          "tokens": 69843,
          "time": 85.2
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.0258,
          "tokens": 91720,
          "time": 84.5
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.0254,
          "tokens": 74066,
          "time": 111.6
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.0197,
          "tokens": 56229,
          "time": 98.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.0149,
          "tokens": 37772,
          "time": 79.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.0423,
          "tokens": 141289,
          "time": 108.8
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.0186,
          "tokens": 64833,
          "time": 61.7
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.0242,
          "tokens": 80152,
          "time": 85.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": true,
          "cost": 0.0206,
          "tokens": 68653,
          "time": 82.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.0354,
          "tokens": 123487,
          "time": 82.3
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.016,
          "tokens": 53211,
          "time": 58.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.0399,
          "tokens": 131837,
          "time": 106.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.0308,
          "tokens": 102197,
          "time": 73.6
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.0381,
          "tokens": 115495,
          "time": 106.1
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": true,
          "cost": 0.032,
          "tokens": 105846,
          "time": 78.1
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.0121,
          "tokens": 33831,
          "time": 57.0
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.039,
          "tokens": 111366,
          "time": 120.0
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": true,
          "cost": 0.0219,
          "tokens": 76207,
          "time": 53.4
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": true,
          "cost": 0.0173,
          "tokens": 56003,
          "time": 55.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 0.0342,
          "tokens": 100314,
          "time": 99.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": true,
          "cost": 0.0351,
          "tokens": 114795,
          "time": 76.5
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": true,
          "cost": 0.034,
          "tokens": 116058,
          "time": 70.3
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.015,
          "tokens": 47565,
          "time": 49.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.0341,
          "tokens": 111893,
          "time": 74.0
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.0179,
          "tokens": 50352,
          "time": 61.3
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.0204,
          "tokens": 69751,
          "time": 49.4
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.0229,
          "tokens": 71421,
          "time": 61.7
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.0185,
          "tokens": 53478,
          "time": 54.0
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.0242,
          "tokens": 83114,
          "time": 46.8
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.0145,
          "tokens": 38534,
          "time": 50.0
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": true,
          "cost": 0.0197,
          "tokens": 66018,
          "time": 48.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": true,
          "cost": 0.0277,
          "tokens": 82842,
          "time": 75.9
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": true,
          "cost": 0.0183,
          "tokens": 46162,
          "time": 70.2
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.0106,
          "tokens": 33452,
          "time": 40.5
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.0152,
          "tokens": 44102,
          "time": 53.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.0103,
          "tokens": 32961,
          "time": 38.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.0195,
          "tokens": 50436,
          "time": 71.9
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.0164,
          "tokens": 46130,
          "time": 55.1
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.0207,
          "tokens": 65059,
          "time": 43.8
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.0265,
          "tokens": 83577,
          "time": 59.0
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": true,
          "cost": 0.0192,
          "tokens": 59472,
          "time": 51.2
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.0171,
          "tokens": 50909,
          "time": 45.3
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.0155,
          "tokens": 45921,
          "time": 54.3
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": true,
          "cost": 0.0145,
          "tokens": 45540,
          "time": 56.5
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.0175,
          "tokens": 47910,
          "time": 61.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.0165,
          "tokens": 45230,
          "time": 52.1
        }
      ]
    },
    {
      "runKey": "rag-gemini-3.5-flash",
      "harness": "trace-rag",
      "model": "gemini-3.5-flash",
      "modelName": "gemini-3.5-flash",
      "reported": {
        "cost": 0.273,
        "tokens": 269000,
        "time": 147,
        "tokensEstimated": false
      },
      "cases": [
        {
          "task": "108-24-no-recording-sessions-policy-v0",
          "passed": false,
          "cost": 0.2041,
          "tokens": 124304,
          "time": 119.3
        },
        {
          "task": "108-24-no-recording-sessions-policy-v1",
          "passed": false,
          "cost": 0.1989,
          "tokens": 124093,
          "time": 136.0
        },
        {
          "task": "108-24-no-recording-sessions-policy-v2",
          "passed": false,
          "cost": 0.5009,
          "tokens": 326533,
          "time": 118.1
        },
        {
          "task": "108-24-no-recording-sessions-policy-v3",
          "passed": false,
          "cost": 0.6018,
          "tokens": 394943,
          "time": 57.1
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v0",
          "passed": false,
          "cost": 0.1942,
          "tokens": 125294,
          "time": 84.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v1",
          "passed": true,
          "cost": 0.582,
          "tokens": 362679,
          "time": 188.2
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v2",
          "passed": false,
          "cost": 0.623,
          "tokens": 400640,
          "time": 122.0
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v3",
          "passed": false,
          "cost": 0.4127,
          "tokens": 269578,
          "time": 117.3
        },
        {
          "task": "108-25-sibling-name-disambiguation-holden-hayden-v4",
          "passed": false,
          "cost": 0.7538,
          "tokens": 167231,
          "time": 253.2
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v0",
          "passed": false,
          "cost": 0.6132,
          "tokens": 403631,
          "time": 75.1
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v1",
          "passed": false,
          "cost": 0.7654,
          "tokens": 485099,
          "time": 115.3
        },
        {
          "task": "108-46-math-only-service-scope-progressive-timeline-v2",
          "passed": false,
          "cost": 0.4433,
          "tokens": 290670,
          "time": 63.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v0",
          "passed": false,
          "cost": 0.6109,
          "tokens": 391623,
          "time": 108.3
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v1",
          "passed": false,
          "cost": 0.6851,
          "tokens": 442761,
          "time": 66.0
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v2",
          "passed": false,
          "cost": 0.7344,
          "tokens": 483259,
          "time": 130.2
        },
        {
          "task": "108-47-ai-disclosure-to-teachers-v3",
          "passed": false,
          "cost": 0.8585,
          "tokens": 558315,
          "time": 64.6
        },
        {
          "task": "180-08-no-chrome-use-safari-v1",
          "passed": false,
          "cost": 0.6686,
          "tokens": 435466,
          "time": 318.4
        },
        {
          "task": "180-08-no-chrome-use-safari-v2",
          "passed": false,
          "cost": 0.2687,
          "tokens": 165653,
          "time": 292.7
        },
        {
          "task": "180-09-brother-nastori-recall-v0",
          "passed": false,
          "cost": 0.6504,
          "tokens": 422213,
          "time": 175.2
        },
        {
          "task": "180-09-brother-nastori-recall-v1",
          "passed": false,
          "cost": 0.2567,
          "tokens": 166891,
          "time": 307.9
        },
        {
          "task": "180-09-brother-nastori-recall-v3",
          "passed": false,
          "cost": 0.642,
          "tokens": 419382,
          "time": 323.1
        },
        {
          "task": "180-10-parent-override-directive-v0",
          "passed": false,
          "cost": 0.527,
          "tokens": 342915,
          "time": 333.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v0",
          "passed": false,
          "cost": 0.5985,
          "tokens": 387308,
          "time": 131.6
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v1",
          "passed": false,
          "cost": 0.1555,
          "tokens": 100179,
          "time": 277.4
        },
        {
          "task": "180-11-joe-louis-specific-project-recall-v2",
          "passed": true,
          "cost": 0.5843,
          "tokens": 377798,
          "time": 316.4
        },
        {
          "task": "180-38-space-interest-not-animal-v0",
          "passed": false,
          "cost": 0.0835,
          "tokens": 53041,
          "time": 243.7
        },
        {
          "task": "180-38-space-interest-not-animal-v1",
          "passed": false,
          "cost": 0.4792,
          "tokens": 299176,
          "time": 340.6
        },
        {
          "task": "180-38-space-interest-not-animal-v2",
          "passed": false,
          "cost": 0.5188,
          "tokens": 339220,
          "time": 101.8
        },
        {
          "task": "180-38-space-interest-not-animal-v3",
          "passed": false,
          "cost": 0.1337,
          "tokens": 84578,
          "time": 278.0
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v1",
          "passed": false,
          "cost": 0.1387,
          "tokens": 88156,
          "time": 220.7
        },
        {
          "task": "180-39-vietnamese-glosses-permission-v2",
          "passed": false,
          "cost": 0.5898,
          "tokens": 383429,
          "time": 143.1
        },
        {
          "task": "180-41-vocab-batch-tracking-v0",
          "passed": false,
          "cost": 0.3974,
          "tokens": 256311,
          "time": 316.8
        },
        {
          "task": "180-41-vocab-batch-tracking-v1",
          "passed": false,
          "cost": 0.338,
          "tokens": 220731,
          "time": 282.6
        },
        {
          "task": "180-41-vocab-batch-tracking-v2",
          "passed": false,
          "cost": 0.5744,
          "tokens": 377103,
          "time": 308.4
        },
        {
          "task": "180-41-vocab-batch-tracking-v3",
          "passed": false,
          "cost": 1.0372,
          "tokens": 678369,
          "time": 330.4
        },
        {
          "task": "197-48-weekly-subject-schedule-v0",
          "passed": false,
          "cost": 0.5591,
          "tokens": 346712,
          "time": 254.8
        },
        {
          "task": "197-48-weekly-subject-schedule-v4",
          "passed": false,
          "cost": 0.4328,
          "tokens": 281749,
          "time": 193.4
        },
        {
          "task": "197-49-test-format-question-count-v0",
          "passed": false,
          "cost": 0.4614,
          "tokens": 299497,
          "time": 139.2
        },
        {
          "task": "197-49-test-format-question-count-v1",
          "passed": false,
          "cost": 0.6405,
          "tokens": 419142,
          "time": 316.8
        },
        {
          "task": "197-49-test-format-question-count-v2",
          "passed": false,
          "cost": 0.8847,
          "tokens": 578570,
          "time": 216.9
        },
        {
          "task": "197-49-test-format-question-count-v3",
          "passed": false,
          "cost": 0.4677,
          "tokens": 301182,
          "time": 272.3
        },
        {
          "task": "197-49-test-format-question-count-v4",
          "passed": false,
          "cost": 0.5384,
          "tokens": 347952,
          "time": 236.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v0",
          "passed": false,
          "cost": 0.3358,
          "tokens": 220352,
          "time": 111.2
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v1",
          "passed": false,
          "cost": 0.0546,
          "tokens": 33748,
          "time": 331.7
        },
        {
          "task": "197-51-eighty-percent-word-problem-mix-v4",
          "passed": false,
          "cost": 0.4325,
          "tokens": 275337,
          "time": 321.8
        },
        {
          "task": "202-84-ela-report-card-link-recency-v1",
          "passed": false,
          "cost": 0.2415,
          "tokens": 149445,
          "time": 78.9
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v0",
          "passed": false,
          "cost": 1.2524,
          "tokens": 803558,
          "time": 71.2
        },
        {
          "task": "202-85-homework-song-titles-fidelity-v2",
          "passed": true,
          "cost": 0.4826,
          "tokens": 285929,
          "time": 133.4
        },
        {
          "task": "214-30-original-scope-recall-v0",
          "passed": false,
          "cost": 0.5227,
          "tokens": 342913,
          "time": 47.9
        },
        {
          "task": "214-30-original-scope-recall-v2",
          "passed": false,
          "cost": 0.5529,
          "tokens": 355895,
          "time": 130.4
        },
        {
          "task": "214-30-original-scope-recall-v3",
          "passed": false,
          "cost": 0.6247,
          "tokens": 407933,
          "time": 113.4
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v0",
          "passed": false,
          "cost": 0.8894,
          "tokens": 578012,
          "time": 168.0
        },
        {
          "task": "214-97-operator-pause-until-paid-upgrade-v1",
          "passed": false,
          "cost": 0.7621,
          "tokens": 501865,
          "time": 78.3
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v2",
          "passed": false,
          "cost": 0.6821,
          "tokens": 436298,
          "time": 109.6
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v3",
          "passed": false,
          "cost": 0.3346,
          "tokens": 214651,
          "time": 56.8
        },
        {
          "task": "216-22-wednesday-extended-slot-progressive-v4",
          "passed": false,
          "cost": 0.9833,
          "tokens": 316957,
          "time": 225.8
        },
        {
          "task": "216-23-45-min-session-length-commitment-v0",
          "passed": true,
          "cost": 0.6016,
          "tokens": 387229,
          "time": 75.7
        },
        {
          "task": "216-23-45-min-session-length-commitment-v1",
          "passed": false,
          "cost": 0.5669,
          "tokens": 366083,
          "time": 121.9
        },
        {
          "task": "216-23-45-min-session-length-commitment-v2",
          "passed": false,
          "cost": 0.5856,
          "tokens": 382479,
          "time": 70.5
        },
        {
          "task": "216-23-45-min-session-length-commitment-v3",
          "passed": true,
          "cost": 0.2165,
          "tokens": 133602,
          "time": 89.6
        },
        {
          "task": "216-23-45-min-session-length-commitment-v4",
          "passed": false,
          "cost": 0.4425,
          "tokens": 274380,
          "time": 85.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v0",
          "passed": false,
          "cost": 0.8898,
          "tokens": 571572,
          "time": 320.8
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v1",
          "passed": false,
          "cost": 0.135,
          "tokens": 84021,
          "time": 301.5
        },
        {
          "task": "219-73-juliana-is-the-parent-adult-learner-v2",
          "passed": false,
          "cost": 0.2112,
          "tokens": 129840,
          "time": 226.1
        },
        {
          "task": "219-76-department-of-war-not-defense-v3",
          "passed": false,
          "cost": 0.4949,
          "tokens": 323537,
          "time": 162.3
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v0",
          "passed": true,
          "cost": 0.3976,
          "tokens": 255671,
          "time": 282.5
        },
        {
          "task": "219-86-lecun-feifei-researcher-pair-v2",
          "passed": false,
          "cost": 0.5159,
          "tokens": 331263,
          "time": 349.7
        },
        {
          "task": "219-87-gavin-logout-was-parent-device-switch-v0",
          "passed": false,
          "cost": 1.1535,
          "tokens": 740361,
          "time": 324.8
        },
        {
          "task": "219-89-earth-day-totoro-spec-v0",
          "passed": false,
          "cost": 0.2219,
          "tokens": 142284,
          "time": 278.0
        },
        {
          "task": "219-89-earth-day-totoro-spec-v1",
          "passed": true,
          "cost": 0.4244,
          "tokens": 263115,
          "time": 194.2
        },
        {
          "task": "219-89-earth-day-totoro-spec-v2",
          "passed": false,
          "cost": 0.2968,
          "tokens": 192506,
          "time": 323.9
        },
        {
          "task": "219-89-earth-day-totoro-spec-v3",
          "passed": false,
          "cost": 0.2991,
          "tokens": 195219,
          "time": 225.1
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v0",
          "passed": false,
          "cost": 0.3585,
          "tokens": 232107,
          "time": 288.2
        },
        {
          "task": "268-69-aditi-30-minute-sessions-v2",
          "passed": false,
          "cost": 0.4332,
          "tokens": 276550,
          "time": 326.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v2",
          "passed": false,
          "cost": 0.5893,
          "tokens": 380556,
          "time": 334.8
        },
        {
          "task": "268-72-pia-traveling-overseas-india-v3",
          "passed": false,
          "cost": 0.3445,
          "tokens": 215667,
          "time": 349.0
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v0",
          "passed": false,
          "cost": 0.7542,
          "tokens": 496791,
          "time": 174.2
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v1",
          "passed": false,
          "cost": 0.561,
          "tokens": 366763,
          "time": 143.5
        },
        {
          "task": "268-91-module-6-two-step-equations-wednesday-test-v2",
          "passed": false,
          "cost": 0.2934,
          "tokens": 185216,
          "time": 189.4
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v0",
          "passed": true,
          "cost": 0.3078,
          "tokens": 196244,
          "time": 306.6
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v1",
          "passed": true,
          "cost": 0.276,
          "tokens": 176743,
          "time": 245.1
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v2",
          "passed": false,
          "cost": 0.5914,
          "tokens": 389881,
          "time": 301.8
        },
        {
          "task": "268-92-amc8-test-date-jan-25-2026-v3",
          "passed": false,
          "cost": 0.5008,
          "tokens": 325485,
          "time": 298.6
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v0",
          "passed": false,
          "cost": 0.5,
          "tokens": 325631,
          "time": 110.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v1",
          "passed": false,
          "cost": 0.385,
          "tokens": 242979,
          "time": 61.3
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v2",
          "passed": false,
          "cost": 0.1108,
          "tokens": 67795,
          "time": 72.0
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v3",
          "passed": false,
          "cost": 0.504,
          "tokens": 329876,
          "time": 132.8
        },
        {
          "task": "294-52-chloe-regular-slot-mwf-430-v4",
          "passed": false,
          "cost": 0.6969,
          "tokens": 444175,
          "time": 93.1
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v0",
          "passed": false,
          "cost": 0.3348,
          "tokens": 214827,
          "time": 137.2
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v1",
          "passed": true,
          "cost": 1.1583,
          "tokens": 758244,
          "time": 107.6
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v2",
          "passed": false,
          "cost": 0.263,
          "tokens": 171218,
          "time": 98.8
        },
        {
          "task": "294-53-carmindy-precal-not-trig-v3",
          "passed": false,
          "cost": 0.2304,
          "tokens": 149041,
          "time": 83.5
        },
        {
          "task": "294-54-williams-referral-code-v0",
          "passed": true,
          "cost": 0.2079,
          "tokens": 131161,
          "time": 246.3
        },
        {
          "task": "294-54-williams-referral-code-v1",
          "passed": false,
          "cost": 0.0768,
          "tokens": 46556,
          "time": 140.7
        },
        {
          "task": "294-54-williams-referral-code-v2",
          "passed": true,
          "cost": 0.1133,
          "tokens": 67223,
          "time": 141.2
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v0",
          "passed": false,
          "cost": 0.104,
          "tokens": 64025,
          "time": 77.6
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v1",
          "passed": true,
          "cost": 0.2261,
          "tokens": 140585,
          "time": 138.8
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v2",
          "passed": false,
          "cost": 0.1596,
          "tokens": 101485,
          "time": 85.0
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v3",
          "passed": false,
          "cost": 0.1536,
          "tokens": 94376,
          "time": 92.4
        },
        {
          "task": "294-80-carmindy-tue-thu-345-415-v4",
          "passed": false,
          "cost": 0.8479,
          "tokens": 233726,
          "time": 295.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v0",
          "passed": false,
          "cost": 1.2945,
          "tokens": 856751,
          "time": 225.6
        },
        {
          "task": "304-12-test-mode-directive-recall-v1",
          "passed": false,
          "cost": 1.2281,
          "tokens": 492974,
          "time": 465.1
        },
        {
          "task": "304-12-test-mode-directive-recall-v2",
          "passed": false,
          "cost": 1.3112,
          "tokens": 550928,
          "time": 389.4
        },
        {
          "task": "304-12-test-mode-directive-recall-v3",
          "passed": false,
          "cost": 0.3276,
          "tokens": 215011,
          "time": 149.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v0",
          "passed": false,
          "cost": 0.6146,
          "tokens": 401757,
          "time": 224.6
        },
        {
          "task": "304-13-stale-schedule-vs-actual-pattern-v3",
          "passed": false,
          "cost": 0.5787,
          "tokens": 378720,
          "time": 226.1
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v0",
          "passed": false,
          "cost": 1.1614,
          "tokens": 770452,
          "time": 236.6
        },
        {
          "task": "304-14-numerator-denominator-taxonomy-v2",
          "passed": false,
          "cost": 0.273,
          "tokens": 178042,
          "time": 395.8
        },
        {
          "task": "304-15-shadow-compass-remediation-v0",
          "passed": true,
          "cost": 0.2546,
          "tokens": 154990,
          "time": 219.7
        },
        {
          "task": "304-15-shadow-compass-remediation-v1",
          "passed": false,
          "cost": 0.3763,
          "tokens": 245334,
          "time": 201.8
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v0",
          "passed": false,
          "cost": 0.317,
          "tokens": 202371,
          "time": 169.6
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v1",
          "passed": false,
          "cost": 0.2228,
          "tokens": 143682,
          "time": 166.2
        },
        {
          "task": "350-34-mon-thu-5pm-schedule-correction-v3",
          "passed": false,
          "cost": 0.4124,
          "tokens": 268527,
          "time": 157.2
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v0",
          "passed": false,
          "cost": 0.3873,
          "tokens": 251207,
          "time": 166.6
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v1",
          "passed": true,
          "cost": 0.5095,
          "tokens": 324410,
          "time": 166.8
        },
        {
          "task": "350-94-teacher-mrs-teasley-walnut-grove-kayle-v3",
          "passed": false,
          "cost": 0.5745,
          "tokens": 374232,
          "time": 180.4
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v0",
          "passed": false,
          "cost": 0.6948,
          "tokens": 456770,
          "time": 149.0
        },
        {
          "task": "350-95-karter-fractions-test-score-84-v1",
          "passed": false,
          "cost": 0.8132,
          "tokens": 536483,
          "time": 155.4
        },
        {
          "task": "350-96-parent-name-mrs-marsha-suggs-v0",
          "passed": false,
          "cost": 1.2768,
          "tokens": 832702,
          "time": 163.6
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v2",
          "passed": false,
          "cost": 0.4579,
          "tokens": 297228,
          "time": 153.8
        },
        {
          "task": "367-61-teaching-textbooks-pre-algebra-v3",
          "passed": false,
          "cost": 0.4048,
          "tokens": 259609,
          "time": 153.6
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v0",
          "passed": false,
          "cost": 0.3845,
          "tokens": 250357,
          "time": 171.0
        },
        {
          "task": "367-62-mon-10-tue-fri-11-schedule-v3",
          "passed": false,
          "cost": 0.4613,
          "tokens": 295983,
          "time": 118.3
        },
        {
          "task": "367-63-subscription-paused-march-7-v0",
          "passed": true,
          "cost": 0.3963,
          "tokens": 255785,
          "time": 112.8
        },
        {
          "task": "367-63-subscription-paused-march-7-v1",
          "passed": true,
          "cost": 0.1169,
          "tokens": 67784,
          "time": 112.2
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v1",
          "passed": false,
          "cost": 0.6254,
          "tokens": 410376,
          "time": 127.3
        },
        {
          "task": "367-64-riley-curriculum-mastery-level-v2",
          "passed": false,
          "cost": 0.738,
          "tokens": 475460,
          "time": 121.2
        },
        {
          "task": "699-55b-use-benaiah-when-writing-ABOUT-him-formally-v1",
          "passed": false,
          "cost": 0.7285,
          "tokens": 470179,
          "time": 96.1
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v0",
          "passed": false,
          "cost": 0.3938,
          "tokens": 249402,
          "time": 105.2
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v1",
          "passed": false,
          "cost": 0.3044,
          "tokens": 191279,
          "time": 101.8
        },
        {
          "task": "699-56-nephew-add-to-existing-account-bryan-override-v3",
          "passed": false,
          "cost": 0.2202,
          "tokens": 134633,
          "time": 84.9
        },
        {
          "task": "699-78-parent-is-guardian-not-biological-mother-v3",
          "passed": false,
          "cost": 0.2497,
          "tokens": 153461,
          "time": 102.7
        },
        {
          "task": "719-32-standing-630-pm-schedule-v0",
          "passed": true,
          "cost": 0.5558,
          "tokens": 359944,
          "time": 99.0
        },
        {
          "task": "719-32-standing-630-pm-schedule-v1",
          "passed": true,
          "cost": 0.7501,
          "tokens": 480794,
          "time": 92.8
        },
        {
          "task": "719-32-standing-630-pm-schedule-v2",
          "passed": false,
          "cost": 0.3893,
          "tokens": 243451,
          "time": 86.2
        },
        {
          "task": "719-32-standing-630-pm-schedule-v3",
          "passed": false,
          "cost": 0.4069,
          "tokens": 263161,
          "time": 77.9
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v0",
          "passed": false,
          "cost": 0.4463,
          "tokens": 292770,
          "time": 72.2
        },
        {
          "task": "719-33-test-rescheduled-to-monday-v3",
          "passed": false,
          "cost": 0.3478,
          "tokens": 220083,
          "time": 79.1
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v0",
          "passed": true,
          "cost": 0.8198,
          "tokens": 220369,
          "time": 300.5
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v1",
          "passed": true,
          "cost": 0.4057,
          "tokens": 258899,
          "time": 64.9
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v2",
          "passed": false,
          "cost": 0.1822,
          "tokens": 101166,
          "time": 76.0
        },
        {
          "task": "732-36-wednesday-5pm-youth-group-override-732-v3",
          "passed": true,
          "cost": 0.3035,
          "tokens": 172658,
          "time": 82.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v0",
          "passed": false,
          "cost": 0.3996,
          "tokens": 260661,
          "time": 58.3
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v1",
          "passed": false,
          "cost": 0.629,
          "tokens": 405486,
          "time": 77.2
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v3",
          "passed": false,
          "cost": 0.3218,
          "tokens": 196429,
          "time": 76.0
        },
        {
          "task": "732-93-tue-thu-reading-30-writing-20-split-v4",
          "passed": false,
          "cost": 0.634,
          "tokens": 410156,
          "time": 63.4
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v0",
          "passed": false,
          "cost": 0.1369,
          "tokens": 86920,
          "time": 61.1
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v1",
          "passed": false,
          "cost": 0.1918,
          "tokens": 122724,
          "time": 72.0
        },
        {
          "task": "745-57-last-kids-on-earth-book-series-v3",
          "passed": false,
          "cost": 0.1352,
          "tokens": 85691,
          "time": 59.9
        },
        {
          "task": "745-58-business-name-mini-moments-v0",
          "passed": false,
          "cost": 0.2966,
          "tokens": 192598,
          "time": 43.1
        },
        {
          "task": "745-58-business-name-mini-moments-v2",
          "passed": false,
          "cost": 0.3488,
          "tokens": 226531,
          "time": 58.9
        },
        {
          "task": "745-59-sessions-mix-in-other-subjects-v1",
          "passed": false,
          "cost": 0.1855,
          "tokens": 117785,
          "time": 61.7
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v0",
          "passed": false,
          "cost": 0.0994,
          "tokens": 62479,
          "time": 53.2
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v2",
          "passed": false,
          "cost": 0.1489,
          "tokens": 95623,
          "time": 49.0
        },
        {
          "task": "745-60-douglas-homework-1-to-15-and-28-29-v3",
          "passed": false,
          "cost": 0.1919,
          "tokens": 122357,
          "time": 56.6
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v0",
          "passed": false,
          "cost": 0.1303,
          "tokens": 83197,
          "time": 51.6
        },
        {
          "task": "745-81-behavior-reporting-to-therapist-v1",
          "passed": false,
          "cost": 0.1907,
          "tokens": 121763,
          "time": 51.5
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v1",
          "passed": false,
          "cost": 0.6487,
          "tokens": 115420,
          "time": 222.2
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v4",
          "passed": false,
          "cost": 0.1281,
          "tokens": 81474,
          "time": 52.7
        },
        {
          "task": "745-82-doug-tired-claim-is-avoidance-v5",
          "passed": false,
          "cost": 0.206,
          "tokens": 126870,
          "time": 54.3
        },
        {
          "task": "745-83-no-repitch-human-tutor-v0",
          "passed": false,
          "cost": 0.7406,
          "tokens": 484836,
          "time": 59.5
        },
        {
          "task": "745-83-no-repitch-human-tutor-v1",
          "passed": false,
          "cost": 0.1491,
          "tokens": 95597,
          "time": 52.9
        },
        {
          "task": "745-83-no-repitch-human-tutor-v4",
          "passed": false,
          "cost": 0.1506,
          "tokens": 95625,
          "time": 47.8
        },
        {
          "task": "804-27-referral-link-cantave-v0",
          "passed": false,
          "cost": 0.2838,
          "tokens": 176693,
          "time": 52.0
        },
        {
          "task": "804-27-referral-link-cantave-v1",
          "passed": false,
          "cost": 0.3369,
          "tokens": 220161,
          "time": 35.6
        },
        {
          "task": "804-27-referral-link-cantave-v2",
          "passed": false,
          "cost": 0.2285,
          "tokens": 146493,
          "time": 46.9
        },
        {
          "task": "804-27-referral-link-cantave-v3",
          "passed": false,
          "cost": 0.4074,
          "tokens": 249608,
          "time": 54.6
        },
        {
          "task": "804-27-referral-link-cantave-v4",
          "passed": false,
          "cost": 0.2758,
          "tokens": 175259,
          "time": 45.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v0",
          "passed": false,
          "cost": 0.2142,
          "tokens": 135615,
          "time": 51.6
        },
        {
          "task": "804-28-parent-email-icloud-recall-v1",
          "passed": false,
          "cost": 0.2344,
          "tokens": 148453,
          "time": 45.9
        },
        {
          "task": "804-28-parent-email-icloud-recall-v2",
          "passed": false,
          "cost": 0.3163,
          "tokens": 202223,
          "time": 44.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v3",
          "passed": true,
          "cost": 0.1912,
          "tokens": 121354,
          "time": 43.7
        },
        {
          "task": "804-28-parent-email-icloud-recall-v4",
          "passed": false,
          "cost": 0.3044,
          "tokens": 191160,
          "time": 49.9
        },
        {
          "task": "804-42-cj-pronouns-he-him-v2",
          "passed": false,
          "cost": 0.1565,
          "tokens": 96623,
          "time": 45.5
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v3",
          "passed": false,
          "cost": 0.0711,
          "tokens": 43852,
          "time": 37.2
        },
        {
          "task": "804-43-cj-christina-twin-disambiguation-v4",
          "passed": false,
          "cost": 0.1954,
          "tokens": 125064,
          "time": 40.8
        },
        {
          "task": "857-66-rome-project-what-romans-ate-v0",
          "passed": true,
          "cost": 0.4657,
          "tokens": 300580,
          "time": 39.0
        },
        {
          "task": "857-67-parent-name-sabrina-lebron-v0",
          "passed": true,
          "cost": 0.1308,
          "tokens": 81973,
          "time": 33.8
        },
        {
          "task": "857-68-move-on-from-fraction-addition-v0",
          "passed": false,
          "cost": 0.1417,
          "tokens": 89961,
          "time": 31.3
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v0",
          "passed": false,
          "cost": 0.3224,
          "tokens": 208533,
          "time": 35.8
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v1",
          "passed": false,
          "cost": 0.1242,
          "tokens": 79071,
          "time": 33.8
        },
        {
          "task": "945-07a-use-abby-when-writing-TO-her-v2",
          "passed": false,
          "cost": 0.176,
          "tokens": 113932,
          "time": 34.6
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v1",
          "passed": false,
          "cost": 0.3553,
          "tokens": 230644,
          "time": 42.8
        },
        {
          "task": "945-07b-use-abby-when-writing-ABOUT-her-to-3rd-parties-v2",
          "passed": false,
          "cost": 0.2652,
          "tokens": 172983,
          "time": 33.3
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v0",
          "passed": false,
          "cost": 0.1719,
          "tokens": 111085,
          "time": 32.5
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v1",
          "passed": false,
          "cost": 0.2118,
          "tokens": 135038,
          "time": 35.6
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v2",
          "passed": false,
          "cost": 0.3702,
          "tokens": 242410,
          "time": 36.0
        },
        {
          "task": "945-44-subject-exclusion-foreign-language-v3",
          "passed": false,
          "cost": 0.166,
          "tokens": 106528,
          "time": 33.6
        },
        {
          "task": "945-45-specific-named-speech-goals-v0",
          "passed": false,
          "cost": 0.3216,
          "tokens": 208243,
          "time": 38.1
        },
        {
          "task": "945-45-specific-named-speech-goals-v1",
          "passed": false,
          "cost": 0.4141,
          "tokens": 266438,
          "time": 197.4
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v0",
          "passed": false,
          "cost": 0.1397,
          "tokens": 85361,
          "time": 35.2
        },
        {
          "task": "945-98-grandfathered-pricing-with-cascading-patches-v1",
          "passed": false,
          "cost": 0.2453,
          "tokens": 155816,
          "time": 36.2
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v0",
          "passed": false,
          "cost": 0.1643,
          "tokens": 105982,
          "time": 31.7
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v1",
          "passed": false,
          "cost": 0.1821,
          "tokens": 115965,
          "time": 34.4
        },
        {
          "task": "945-99-session-subject-4-item-closed-scope-v2",
          "passed": false,
          "cost": 0.251,
          "tokens": 163356,
          "time": 33.3
        }
      ]
    }
  ]
}
