Experimental browser for the Atmosphere
Introducing olmOCR, our open-source tool to extract clean plain text from PDFs! Built for scale, olmOCR handles many document types with high throughput. Run it on your own GPU for free—at over 3000 token/s, equivalent to $190 per million pages, or 1/32 the cost of GPT-4o!
Feb 25, 2025, 5:03 PM
{ "uri": "at://did:plc:i4kytxgsu3yfsrt2ml3o7tgq/app.bsky.feed.post/3lizdsmfba22n", "cid": "bafyreihln7qm7ealjqahpozbwbcjdohq6nmebt6a4gv6cd4lzobbopmx5q", "value": { "text": "Introducing olmOCR, our open-source tool to extract clean plain text from PDFs!\n\nBuilt for scale, olmOCR handles many document types with high throughput. Run it on your own GPU for free—at over 3000 token/s, equivalent to $190 per million pages, or 1/32 the cost of GPT-4o!", "$type": "app.bsky.feed.post", "embed": { "$type": "app.bsky.embed.video", "video": { "$type": "blob", "ref": { "$link": "bafkreigksekmzaqjgoeopmxwnuehidhkwdirgsahonvz53v2ceex4lgx5e" }, "mimeType": "video/mp4", "size": 815323 }, "aspectRatio": { "width": 1548, "height": 942 } }, "langs": [ "en" ], "createdAt": "2025-02-25T17:03:55.257Z" } }