{
"$type": "site.standard.document",
"bskyPostRef": {
"cid": "bafyreicuhvwotknqjmqhpzwh5325ndtrnvcovee3oq5m3xtt24z6r557s4",
"uri": "at://did:plc:oldu4osfqstkn27t4qzsrgtf/app.bsky.feed.post/3mjbzl2ptg3k2"
},
"path": "/blog/trustworthy-benchmarks-cont/",
"publishedAt": "2026-04-11T19:15:56.000Z",
"site": "https://rdi.berkeley.edu",
"tags": [
"Comments"
],
"textContent": "Comments",
"title": "How We Broke Top AI Agent Benchmarks: And What Comes Next"
}