<?xml version="1.0" encoding="utf-8"?>
<!--
  RSS 2.0 feed produced by PeerTube (see the generator element).
  The channel below carries metadata only: it contains no item elements.
  The self link targets feeds/video-comments.xml with a videoId parameter, so
  this is presumably the comments feed of a single video. TODO confirm against
  the PeerTube feed documentation.
  The atom prefix is declared on the root solely for the atom:link element.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
    <channel>
        <!-- Channel title and link; the link targets a /videos/watch/ page on the instance. -->
        <title>What Do Models Still Suck At? - Peter Gostev, Arena.ai, BullshitBench</title>
        <link>https://video.ut0pia.org/videos/watch/8936a916-fd11-4109-a898-f2ffb162c5d7</link>
        <!--
          Free-text description published with the feed.
          NOTE(review): "millions of user's prompts" likely should read
          "users' prompts". This file is generated, so correct the text in the
          upstream metadata rather than here.
        -->
        <description>What type of real world model responses do users still hate? We get to see millions of user's prompts - and we let users 'dislike both' on the Arena. We'll show you trends and examples of the tasks that LLMs still suck at despite the relentless hillclimbing. Speaker info: https://x.com/petergostev, https://www.linkedin.com/in/peter-gostev/</description>
        <!-- Time the channel content last changed, expressed in GMT. -->
        <lastBuildDate>Sat, 25 Apr 2026 11:41:47 GMT</lastBuildDate>
        <!-- Pointer to documentation of the RSS format used by this file. -->
        <docs>https://validator.w3.org/feed/docs/rss2.html</docs>
        <!-- Program that generated the feed, followed by the instance URL. -->
        <generator>PeerTube - https://video.ut0pia.org</generator>
        <!--
          Channel image. Its title and link repeat the channel's own title and
          link, which is what RSS 2.0 recommends.
          NOTE(review): RSS 2.0 describes the image url as a GIF, JPEG or PNG;
          this one is a .webp file, which some feed readers may not render.
          Verify with the target readers.
        -->
        <image>
            <title>What Do Models Still Suck At? - Peter Gostev, Arena.ai, BullshitBench</title>
            <url>https://video.ut0pia.org/lazy-static/avatars/0287a09a-aae7-4840-9843-b416426e7046.webp</url>
            <link>https://video.ut0pia.org/videos/watch/8936a916-fd11-4109-a898-f2ffb162c5d7</link>
        </image>
        <!-- Copyright notice; it defers to the instance's /about page and per-content licenses. -->
        <copyright>All rights reserved, unless otherwise specified in the terms specified at https://video.ut0pia.org/about and potential licenses granted by each content's rightholder.</copyright>
        <!-- Self reference: the URL of this feed document, declared as application/rss+xml. -->
        <atom:link href="https://video.ut0pia.org/feeds/video-comments.xml?videoId=8936a916-fd11-4109-a898-f2ffb162c5d7" rel="self" type="application/rss+xml"/>
    </channel>
</rss>