{"id":"run-99412c69b7dc","serviceId":"anthropic-claude","benchmarkId":"hellaswag","model":"claude-haiku-4.5","score":100,"runs":1,"breakdown":{"n":8,"passes":8,"mean_raw":1},"sampleCount":8,"runnerVersion":"benchlist-vercel-inline@1.0.0","runnerCommit":"edge","datasetHash":"sha256:b967f14e9705f2c1512bfecbc280340660ac60811aca2cd09789d654cb44b3ee","methodologyHash":"sha256:2725c767f087367a0bbb3d937db51573191931b9f2e7a805d74297244330c18f","transcriptMerkleRoot":"sha256:dd5f6d663d8dcaed58270faafcf0e397def41f4aacab6d18920d0fe2f747e351","startedAt":"2026-04-26T07:43:31.439Z","finishedAt":"2026-04-26T07:52:00.617Z","durationSeconds":509,"decoding":{"temperature":0,"max_tokens":512},"attestor":"benchlist-vercel-inline-0","publisher":"anthropic-claude","replay":{"command":"benchlist run hellaswag --service anthropic-claude --model claude-haiku-4.5 --runs 1 --limit 8","dockerImage":"ghcr.io/benchlist/runner:latest","envRequired":[]},"proof":{"system":"signed-attestation","status":"signed","signature":"7d26da4d17e9c8c3b5a9e59a6444ca5b649c256fa8c0ec7ca0cc23ebbf49e248ed057b4c0c49952e2bc2061fa82aee2ee8de0bcdf57e029c1aa10d02f166480d","pubkey":"cb6e95d0f7b402e254f491b57767df3a3a93ae92f1faee3a02aa52e728f5cd11","signer_algo":"ed25519","public_inputs":{"dataset_hash":"sha256:b967f14e9705f2c1512bfecbc280340660ac60811aca2cd09789d654cb44b3ee","methodology_hash":"sha256:2725c767f087367a0bbb3d937db51573191931b9f2e7a805d74297244330c18f","merkle_root":"sha256:dd5f6d663d8dcaed58270faafcf0e397def41f4aacab6d18920d0fe2f747e351","claimed_score":100}},"verification":{"mode":"signed-attestation","status":"attested","alignedProofSystem":"signed-attestation","attestorPubkey":"cb6e95d0f7b402e254f491b57767df3a3a93ae92f1faee3a02aa52e728f5cd11","attestorSignature":"7d26da4d17e9c8c3b5a9e59a6444ca5b649c256fa8c0ec7ca0cc23ebbf49e248ed057b4c0c49952e2bc2061fa82aee2ee8de0bcdf57e029c1aa10d02f166480d","signerAlgo":"ed25519","submittedAt":"2026-04-26T07:52:00.617Z","verifiedAt":"2026-04-26T07:52:00.617Z","note":"Signed inline by Benchlist Vercel attestor. Set ATTESTOR_PRIVATE_KEY on a GH/Railway worker to add Ethereum L1 anchor."}}