{"id":"run-71345cab5274","serviceId":"anthropic-claude","benchmarkId":"mmlu","model":"claude-haiku-4.5","score":87.5,"runs":1,"breakdown":{"n":8,"passes":7,"mean_raw":0.875},"sampleCount":8,"runnerVersion":"benchlist-vercel-inline@1.0.0","runnerCommit":"edge","datasetHash":"sha256:05ef744f592cd2481092a6ecdecbccaf5e515f6ac2be7d5fc77ad85b8165f15c","methodologyHash":"sha256:f65dba1e549ab81ea004be624791ae7b7b3e784648c0cb2ce84b8bf930bb0457","transcriptMerkleRoot":"sha256:6a06687deb4e771ef77943cde919002b8d27b27ab6ce8d20cef1bdeced61dbd4","startedAt":"2026-04-26T08:37:36.799Z","finishedAt":"2026-04-26T08:38:10.075Z","durationSeconds":33,"decoding":{"temperature":0,"max_tokens":512},"attestor":"benchlist-vercel-inline-0","publisher":"anthropic-claude","replay":{"command":"benchlist run mmlu --service anthropic-claude --model claude-haiku-4.5 --runs 1 --limit 8","dockerImage":"ghcr.io/benchlist/runner:latest","envRequired":[]},"proof":{"system":"signed-attestation","status":"signed","signature":"3472ab4b892ec00c3309b3e73fc456e6366d8a5f7f544f94425c7a1614bdf12bb7c0b11ec3623188aa5b9589db7db2de183c14d57e5236868e819a5479b30706","pubkey":"cb6e95d0f7b402e254f491b57767df3a3a93ae92f1faee3a02aa52e728f5cd11","signer_algo":"ed25519","public_inputs":{"dataset_hash":"sha256:05ef744f592cd2481092a6ecdecbccaf5e515f6ac2be7d5fc77ad85b8165f15c","methodology_hash":"sha256:f65dba1e549ab81ea004be624791ae7b7b3e784648c0cb2ce84b8bf930bb0457","merkle_root":"sha256:6a06687deb4e771ef77943cde919002b8d27b27ab6ce8d20cef1bdeced61dbd4","claimed_score":87.5}},"verification":{"mode":"signed-attestation","status":"attested","alignedProofSystem":"signed-attestation","attestorPubkey":"cb6e95d0f7b402e254f491b57767df3a3a93ae92f1faee3a02aa52e728f5cd11","attestorSignature":"3472ab4b892ec00c3309b3e73fc456e6366d8a5f7f544f94425c7a1614bdf12bb7c0b11ec3623188aa5b9589db7db2de183c14d57e5236868e819a5479b30706","signerAlgo":"ed25519","submittedAt":"2026-04-26T08:38:10.075Z","verifiedAt":"2026-04-26T08:38:10.075Z","note":"Signed inline by Benchlist Vercel attestor. Set ATTESTOR_PRIVATE_KEY on a GH/Railway worker to add Ethereum L1 anchor."}}