Experimental browser for the Atmosphere
Incredibly excited to have this finally come out! Model evaluation should be about comparisons, so we have a metric that puts comparisons in predictive performance on a common scale. I can’t make a thread about this better than @crahal.com, so I’ll let him take it away.
Mar 28, 2025, 3:43 AM
{ "uri": "at://did:plc:eiq3eh7v4xku6bfvscfht3ug/app.bsky.feed.post/3llfvj4sggc2k", "cid": "bafyreia35xxfaw4et7oqqy4h6hej7awwiyntwbki5lwsozoc64u2iuzwni", "value": { "text": "Incredibly excited to have this finally come out! Model evaluation should be about comparisons, so we have a metric that puts comparisons in predictive performance on a common scale. I can’t make a thread about this better than @crahal.com, so I’ll let him take it away.", "$type": "app.bsky.feed.post", "embed": { "$type": "app.bsky.embed.record", "record": { "cid": "bafyreid2xzflfu3ujzs6i6kpg32lcykut4hhf2nk5fcvztk4wh273fnjd4", "uri": "at://did:plc:3eqqhalroalwrnikhbwqtgki/app.bsky.feed.post/3llekxw2l5k26" } }, "langs": [ "en" ], "facets": [ { "$type": "app.bsky.richtext.facet", "index": { "byteEnd": 241, "byteStart": 230 }, "features": [ { "did": "did:plc:3eqqhalroalwrnikhbwqtgki", "$type": "app.bsky.richtext.facet#mention" } ] } ], "createdAt": "2025-03-28T03:43:04.388Z" } }