STET

run_metadata

runs/2026-02-21__03-36-16__gpt-5-1-codex-mini/run_metadata.json

1681 bytes

Back to adjudication
{
  "run_id": "2026-02-21__03-36-16__gpt-5-1-codex-mini",
  "uuid": "2b8f580d-fa06-43de-b6f9-5fc07c5af93f",
  "dataset_path": "/Users/ben/dev/flux/.tmp/sqlparser-rs-dataset",
  "dataset_name": null,
  "dataset_version": null,
  "output_path": "/Users/ben/dev/flux/.tmp/h2h-sqlparser-flu77-mini/runs",
  "agent_name": "codex",
  "no_rebuild": false,
  "cleanup": true,
  "log_level": 20,
  "task_ids": [
    "flux-pr-1791",
    "flux-pr-1839",
    "flux-pr-2148",
    "flux-pr-1759",
    "flux-pr-2172",
    "flux-pr-1891",
    "flux-pr-1435",
    "flux-pr-1526",
    "flux-pr-1747",
    "flux-pr-1441",
    "flux-pr-2151",
    "flux-pr-1604",
    "flux-pr-1534",
    "flux-pr-1500",
    "flux-pr-1495",
    "flux-pr-1649",
    "flux-pr-1576",
    "flux-pr-1628",
    "flux-pr-2096",
    "flux-pr-2011",
    "flux-pr-2170",
    "flux-pr-1918",
    "flux-pr-1501",
    "flux-pr-1900",
    "flux-pr-1908",
    "flux-pr-1414",
    "flux-pr-1765",
    "flux-pr-1965",
    "flux-pr-1984",
    "flux-pr-2185"
  ],
  "exclude_task_ids": null,
  "n_tasks": null,
  "n_concurrent_trials": 4,
  "n_attempts": 1,
  "dataset_size": 30,
  "accuracy": 0.13333333333333333,
  "model_name": "gpt-5.1-codex-mini",
  "start_time": "2026-02-21T03:36:19.613445+00:00",
  "end_time": "2026-02-21T05:57:20.725706+00:00",
  "commit_hash": "f09baebe0424b002663dfd81a4ba49701bb870e3",
  "username": "Test User",
  "s3_bucket": null,
  "agent_kwargs": null,
  "pass_at_k": {},
  "resumed_at": null,
  "reasoning_effort": "medium"
}