STET

trajectory

validation/gpt-5-1-codex-mini/flux-pr-1240/trajectory.v1.json

15381 bytes

Back to adjudication
{
  "version": "v1",
  "materialization": {
    "mode": "canonical"
  },
  "identity": {
    "variant_id": "gpt-5-1-codex-mini",
    "requested_model": "gpt-5-1-codex-mini",
    "model_key": "gpt-5-1-codex-mini",
    "run_id": "2026-02-21__03-36-16__gpt-5-1-codex-mini",
    "task_id": "flux-pr-1240",
    "trial_name": "flux-pr-1240.1-of-1.2026-02-21__03-36-16__gpt-5-1-codex-mini"
  },
  "availability": "partial_order_only",
  "state_detail": "provider-native trajectory captured; validation and decision steps are appended with coarse ordering only",
  "provider": "codex",
  "steps": [
    {
      "id": "step-01",
      "index": 0,
      "kind": "session_start",
      "title": "Session started",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-02",
      "index": 1,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-03",
      "index": 2,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-04",
      "index": 3,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-05",
      "index": 4,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-06",
      "index": 5,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-07",
      "index": 6,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-08",
      "index": 7,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-09",
      "index": 8,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-10",
      "index": 9,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-11",
      "index": 10,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-12",
      "index": 11,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-13",
      "index": 12,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-14",
      "index": 13,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-15",
      "index": 14,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-16",
      "index": 15,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-17",
      "index": 16,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-18",
      "index": 17,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-19",
      "index": 18,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-20",
      "index": 19,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-21",
      "index": 20,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 2",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-22",
      "index": 21,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-23",
      "index": 22,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-24",
      "index": 23,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-25",
      "index": 24,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 1",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-26",
      "index": 25,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-27",
      "index": 26,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-28",
      "index": 27,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-29",
      "index": 28,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-30",
      "index": 29,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-31",
      "index": 30,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-32",
      "index": 31,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-33",
      "index": 32,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 2",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-34",
      "index": 33,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-35",
      "index": 34,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-36",
      "index": 35,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-37",
      "index": 36,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-38",
      "index": 37,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-39",
      "index": 38,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-40",
      "index": 39,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-41",
      "index": 40,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-42",
      "index": 41,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-43",
      "index": 42,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-44",
      "index": 43,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-45",
      "index": 44,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-46",
      "index": 45,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-47",
      "index": 46,
      "kind": "tool_result",
      "title": "Command finished",
      "detail": "shell command exit code 0",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-48",
      "index": 47,
      "kind": "tool_call",
      "title": "Command started",
      "detail": "shell command",
      "evidence": [
        {
          "artifact_kind": "results",
          "label": "results"
        }
      ]
    },
    {
      "id": "step-49",
      "index": 48,
      "kind": "patch_written",
      "title": "Patch captured",
      "detail": "Flux captured agent.patch for this trial",
      "evidence": [
        {
          "artifact_kind": "agent_patch",
          "label": "agent.patch"
        }
      ]
    },
    {
      "id": "step-50",
      "index": 49,
      "kind": "validation",
      "title": "Tests passed",
      "detail": "go",
      "evidence": [
        {
          "artifact_kind": "validation",
          "label": "validation"
        }
      ]
    },
    {
      "id": "step-51",
      "index": 50,
      "kind": "equivalence",
      "title": "Equivalence judgment",
      "detail": "equivalent",
      "evidence": [
        {
          "artifact_kind": "validation",
          "label": "validation"
        }
      ]
    },
    {
      "id": "step-52",
      "index": 51,
      "kind": "code_review",
      "title": "Code review judgment",
      "detail": "unsure",
      "evidence": [
        {
          "artifact_kind": "task_detail",
          "label": "task detail"
        }
      ]
    },
    {
      "id": "step-53",
      "index": 52,
      "kind": "decision",
      "title": "Final decision",
      "detail": "pass",
      "evidence": [
        {
          "artifact_kind": "task_detail",
          "label": "task detail"
        }
      ]
    }
  ],
  "provenance": [
    {
      "source": "provider_native",
      "available": true,
      "detail": "codex provider-native trajectory copied into agent-logs"
    },
    {
      "source": "validation",
      "available": true
    },
    {
      "source": "task_detail",
      "available": true,
      "fallback": true,
      "detail": "validation and decision steps appended after provider-native events with coarse ordering only"
    }
  ]
}