STET

run_metadata

runs/2026-02-28__13-38-10__gpt-5-3-codex/run_metadata.json

1634 bytes

Back to adjudication
{
  "run_id": "2026-02-28__13-38-10__gpt-5-3-codex",
  "uuid": "f016c196-14e4-422c-bb38-a929de026e67",
  "dataset_path": "/Users/ben/dev/flux/.tmp/graphql-go-tools-dataset",
  "dataset_name": null,
  "dataset_version": null,
  "output_path": "/Users/ben/dev/flux/.tmp/h2h-graphql-w2/runs",
  "agent_name": "codex",
  "no_rebuild": false,
  "cleanup": true,
  "log_level": 20,
  "task_ids": [
    "flux-pr-1380",
    "flux-pr-1240",
    "flux-pr-1155",
    "flux-pr-1309",
    "flux-pr-1232",
    "flux-pr-1308",
    "flux-pr-1128",
    "flux-pr-1184",
    "flux-pr-1260",
    "flux-pr-891",
    "flux-pr-1297",
    "flux-pr-1351",
    "flux-pr-1099",
    "flux-pr-1087",
    "flux-pr-859",
    "flux-pr-1209",
    "flux-pr-1169",
    "flux-pr-1230",
    "flux-pr-1034",
    "flux-pr-1076",
    "flux-pr-1338",
    "flux-pr-817",
    "flux-pr-870",
    "flux-pr-828",
    "flux-pr-1001",
    "flux-pr-1268",
    "flux-pr-1241",
    "flux-pr-1262",
    "flux-pr-1293"
  ],
  "exclude_task_ids": null,
  "n_tasks": null,
  "n_concurrent_trials": 4,
  "n_attempts": 1,
  "dataset_size": 29,
  "accuracy": 0.896551724137931,
  "model_name": "gpt-5.3-codex",
  "start_time": "2026-02-28T13:38:12.733292+00:00",
  "end_time": "2026-02-28T14:43:03.470912+00:00",
  "commit_hash": "99ae882e59281de74856a3e7eeb1b7c986b466af",
  "username": "benredmond",
  "s3_bucket": null,
  "reasoning_effort": "medium",
  "agent_kwargs": null,
  "pass_at_k": {},
  "resumed_at": null
}