Experimental browser for the Atmosphere
MLCommons' MLPerf Training suite has a new #pretraining #benchmark based on #Meta’s Llama 3.1 405B model. We use the same dataset with a bigger model and longer context, offering a more relevant and challenging measure for today’s #AI systems. mlcommons.org/2025/05/trai...
May 5, 2025, 4:22 PM
{ "uri": "at://did:plc:uavs3b5de27ki26k5usmqtxz/app.bsky.feed.post/3logrn6qjm22d", "cid": "bafyreich5qo6itdihkkkplruojdhblaun2b4x4jh6as2pjpng3pu6lyhda", "value": { "text": "MLCommons' MLPerf Training suite has a new #pretraining #benchmark based on #Meta’s Llama 3.1 405B model. We use the same dataset with a bigger model and longer context, offering a more relevant and challenging measure for today’s #AI systems. mlcommons.org/2025/05/trai...", "$type": "app.bsky.feed.post", "embed": { "$type": "app.bsky.embed.external", "external": { "uri": "https://mlcommons.org/2025/05/training-llama31405b/", "thumb": { "$type": "blob", "ref": { "$link": "bafkreidqwzc47bspqsowjlng7ab42r4v6k4cstpkznqxcg5bo5o4qqblr4" }, "mimeType": "image/jpeg", "size": 312053 }, "title": "MLCommons MLPerf Training Expands with Llama 3.1 405B - MLCommons", "description": "MLCommons MLPerf Training Expands with Llama 3.1 405B" } }, "langs": [ "en" ], "facets": [ { "index": { "byteEnd": 55, "byteStart": 43 }, "features": [ { "tag": "pretraining", "$type": "app.bsky.richtext.facet#tag" } ] }, { "index": { "byteEnd": 66, "byteStart": 56 }, "features": [ { "tag": "benchmark", "$type": "app.bsky.richtext.facet#tag" } ] }, { "index": { "byteEnd": 85, "byteStart": 76 }, "features": [ { "tag": "Meta’s", "$type": "app.bsky.richtext.facet#tag" } ] }, { "index": { "byteEnd": 238, "byteStart": 235 }, "features": [ { "tag": "AI", "$type": "app.bsky.richtext.facet#tag" } ] }, { "index": { "byteEnd": 278, "byteStart": 249 }, "features": [ { "uri": "https://mlcommons.org/2025/05/training-llama31405b/", "$type": "app.bsky.richtext.facet#link" } ] } ], "createdAt": "2025-05-05T16:22:00.296Z" } }