{
    "id": "2e9e7af6-b438-43d5-a77b-97df3aa4cdbb",
    "started_at": "2026-06-29T15:29:30.066688",
    "updated_at": "2026-06-29T16:41:54.013443",
    "finished_at": "2026-06-29T16:41:54.013443",
    "n_total_trials": 89,
    "stats": {
        "n_completed_trials": 89,
        "n_errored_trials": 22,
        "n_running_trials": 0,
        "n_pending_trials": 0,
        "n_cancelled_trials": 0,
        "n_retries": 4,
        "evals": {
            "atlarix__minimax/minimax-m3__terminal-bench/terminal-bench-2": {
                "n_trials": 88,
                "n_errors": 22,
                "metrics": [
                    {
                        "mean": 0.47191011235955055
                    }
                ],
                "pass_at_k": {},
                "reward_stats": {
                    "reward": {
                        "0.0": [
                            "make-mips-interpreter__ok2EnrM",
                            "overfull-hbox__UACGxKE",
                            "video-processing__KurwFyX",
                            "break-filter-js-from-html__DifMq7d",
                            "protein-assembly__hTJjKGB",
                            "path-tracing__uyrgLyx",
                            "compile-compcert__hQEhGTH",
                            "dna-assembly__36KyKRG",
                            "caffe-cifar-10__oNUwddW",
                            "install-windows-3-11__wpuEZUR",
                            "crack-7z-hash__BeAsLed",
                            "feal-linear-cryptanalysis__gCdiNjs",
                            "polyglot-rust-c__XNs5Y5T",
                            "cancel-async-tasks__faE3wCc",
                            "rstan-to-pystan__ooEW8tq",
                            "db-wal-recovery__mK4ospC",
                            "winning-avg-corewars__zhatMX4",
                            "mteb-leaderboard__QPUJCVB",
                            "regex-chess__Z7igEqh",
                            "write-compressor__qz5NoFo",
                            "chess-best-move__cmP7RdL",
                            "extract-moves-from-video__F4gdYnr",
                            "gcode-to-text__PZ32rKK",
                            "merge-diff-arc-agi-task__AWVP5UT",
                            "qemu-alpine-ssh__pPuM6cH",
                            "tune-mjcf__z5nyhgt",
                            "sqlite-with-gcov__CK4RDve",
                            "sanitize-git-repo__AdhiUz7",
                            "train-fasttext__Hq3YFXp",
                            "torch-tensor-parallelism__Ld7ppxD",
                            "torch-pipeline-parallelism__cc2NiU9",
                            "raman-fitting__wYw5sEC",
                            "model-extraction-relu-logits__Wn2h885",
                            "filter-js-from-html__YnkynVw",
                            "polyglot-c-py__qS9qiCq",
                            "pytorch-model-cli__oEVD8bm",
                            "bn-fit-modify__2hezsmm",
                            "password-recovery__EpK3sbf",
                            "sam-cell-seg__d5gXkCS",
                            "make-doom-for-mips__LBEMoJo",
                            "adaptive-rejection-sampler__ScbSxe2",
                            "gpt2-codegolf__8vBMp8W",
                            "mcmc-sampling-stan__zJefgMr",
                            "path-tracing-reverse__ZLsB2CJ",
                            "llm-inference-batching-scheduler__iiH4oGV",
                            "configure-git-webserver__gYfyrnv"
                        ],
                        "1.0": [
                            "circuit-fibsqrt__4yMBQzB",
                            "build-pov-ray__CREWSJP",
                            "distribution-search__4Bj59gd",
                            "log-summary-date-ranges__g7gg8Rc",
                            "vulnerable-secret__eb5NJs2",
                            "openssl-selfsigned-cert__G7x3J5j",
                            "dna-insert__sN57rR8",
                            "git-leak-recovery__q3WNoBJ",
                            "headless-terminal__W2RCzmx",
                            "extract-elf__LBais9y",
                            "constraints-scheduling__jHWsuzX",
                            "custom-memory-heap-crash__HF88Rmo",
                            "build-cython-ext__PSfLuFW",
                            "fix-git__ZKzEjyJ",
                            "prove-plus-comm__LVzTaGB",
                            "pytorch-model-recovery__PZhtUkF",
                            "mailman__G3oVanB",
                            "multi-source-data-merger__5fYtPFH",
                            "kv-store-grpc__qFLgvRw",
                            "git-multibranch__Xac54xS",
                            "regex-log__MLUkAgT",
                            "nginx-request-logging__TaNkaMs",
                            "build-pmars__WowFyPh",
                            "reshard-c4-data__pAvEVhA",
                            "schemelike-metacircular-eval__JBHq25a",
                            "count-dataset-tokens__fEvGLCH",
                            "cobol-modernization__zTNVaUD",
                            "pypi-server__t5EjgMr",
                            "hf-model-inference__DCsjyca",
                            "sparql-university__SmCEnfG",
                            "largest-eigenval__eHGhiM2",
                            "fix-ocaml-gc__A6BwQEe",
                            "feal-differential-cryptanalysis__6NCAhGG",
                            "sqlite-db-truncate__rDpsMUF",
                            "fix-code-vulnerability__WY4zuHX",
                            "modernize-scientific-stack__ve7fAon",
                            "financial-document-processor__mrMgy6W",
                            "mteb-retrieve__oRTVAEk",
                            "large-scale-text-editing__yD7NpWc",
                            "code-from-image__JMS6U9Q",
                            "portfolio-optimization__S3Qoudf",
                            "qemu-startup__oES5aXV"
                        ]
                    }
                },
                "exception_stats": {
                    "AgentTimeoutError": [
                        "make-mips-interpreter__ok2EnrM",
                        "break-filter-js-from-html__DifMq7d",
                        "path-tracing__uyrgLyx",
                        "dna-assembly__36KyKRG",
                        "crack-7z-hash__BeAsLed",
                        "polyglot-rust-c__XNs5Y5T",
                        "regex-chess__Z7igEqh",
                        "write-compressor__qz5NoFo",
                        "gcode-to-text__PZ32rKK",
                        "qemu-alpine-ssh__pPuM6cH",
                        "tune-mjcf__z5nyhgt",
                        "torch-pipeline-parallelism__cc2NiU9",
                        "largest-eigenval__eHGhiM2",
                        "polyglot-c-py__qS9qiCq",
                        "password-recovery__EpK3sbf",
                        "make-doom-for-mips__LBEMoJo",
                        "adaptive-rejection-sampler__ScbSxe2",
                        "gpt2-codegolf__8vBMp8W",
                        "large-scale-text-editing__yD7NpWc",
                        "path-tracing-reverse__ZLsB2CJ",
                        "llm-inference-batching-scheduler__iiH4oGV"
                    ],
                    "VerifierTimeoutError": [
                        "query-optimize__8oAHba4"
                    ]
                }
            }
        },
        "n_input_tokens": null,
        "n_cache_tokens": null,
        "n_output_tokens": null,
        "cost_usd": null
    }
}