Experimental browser for the Atmosphere
I wrote about a new AI evaluation called "Humanity's Last Exam," a collection of 3,000 questions submitted by leading academics to try to stump leading AI models, which mostly find today's college-level tests too easy. www.nytimes.com/2025/01/23/t...
Jan 23, 2025, 4:41 PM
{ "uri": "at://did:plc:743s7ikb5po2orglxfs43ins/app.bsky.feed.post/3lggd5tbwes2n", "cid": "bafyreie36vgh5h5adpbgcu4hmlbef433h7cgi5py653b6rnan2h4nezhcy", "value": { "text": "I wrote about a new AI evaluation called \"Humanity's Last Exam,\" a collection of 3,000 questions submitted by leading academics to try to stump leading AI models, which mostly find today's college-level tests too easy.\n\nwww.nytimes.com/2025/01/23/t...", "$type": "app.bsky.feed.post", "embed": { "$type": "app.bsky.embed.external", "external": { "uri": "https://www.nytimes.com/2025/01/23/technology/ai-test-humanitys-last-exam.html?unlocked_article_code=1.rU4.VoJE.ZK8gbYYFh2T6&smid=url-share", "thumb": { "$type": "blob", "ref": { "$link": "bafkreiaboffietvfhn4lfkgaq5jruvazhmpyhyi5todouw4myootkv24rq" }, "mimeType": "image/jpeg", "size": 508105 }, "title": "A Test So Hard No AI System Can Pass It — Yet (Gift Article)", "description": "The creators of a new test called “Humanity’s Last Exam” argue we may soon lose the ability to create tests hard enough for A.I. models." } }, "langs": [ "en" ], "facets": [ { "index": { "byteEnd": 251, "byteStart": 220 }, "features": [ { "uri": "https://www.nytimes.com/2025/01/23/technology/ai-test-humanitys-last-exam.html?unlocked_article_code=1.rU4.VoJE.ZK8gbYYFh2T6&smid=url-share", "$type": "app.bsky.richtext.facet#link" } ] } ], "createdAt": "2025-01-23T16:41:19.559Z" } }