[{"data":1,"prerenderedAt":127},["ShallowReactive",2],{"podcast-meta":3,"podcast-theme-colors":32,"episode-the-confident-idiot-problem-news":92},{"title":4,"author":5,"description":6,"artwork":7,"categories":8,"feedUrl":10,"type":11,"explicit":12,"link":13,"language":14,"copyright":15,"podcast2":16,"hasPeople":31},"The Changelog: Software Development, Open Source","Changelog Media","Software's best weekly news brief, deep technical interviews & talk show.","https://cdn.changelog.com/static/images/podcasts/podcast-original-f16d0363067166f241d080ee2e2d4a28.png",[9],"Technology","https://changelog.com/podcast/feed","episodic",false,"https://changelog.com/podcast","en-us","All rights reserved",{"persons":17,"funding":27},[18,23],{"name":19,"role":20,"img":21,"href":22},"Adam Stacoviak","host","https://cdn.changelog.com/uploads/avatars/people/Qo/avatar_large.jpg?v=63760280419","https://changelog.com/person/adamstac",{"name":24,"role":20,"img":25,"href":26},"Jerod Santo","https://cdn.changelog.com/uploads/avatars/people/z4/avatar_large.jpeg?v=63760071650","https://changelog.com/person/jerodsanto",[28],{"url":29,"text":30},"https://changelog.com/++","Support our work by joining Changelog++",true,{"palette":33,"sourceColor":54,"extractedColors":55},{"light":34,"dark":43},{"primary":35,"primary-foreground":36,"secondary":37,"secondary-foreground":35,"accent":38,"muted":39,"muted-foreground":40,"ring":35,"podcast-vibrant":41,"podcast-muted":42},"#00182f","#ffffff","#eff2f6","#e7ecf0","#f0f2f4","#6f7275","#0375c4","#e2e5e8",{"primary":44,"primary-foreground":45,"secondary":46,"secondary-foreground":47,"accent":48,"muted":49,"muted-foreground":50,"ring":51,"podcast-vibrant":52,"podcast-muted":53},"#5580a9","#09090b","#191b1d","#dcdee0","#1d2022","#1a1b1c","#8d8f91","#c1c4c8","#3694e6","#151618","#a1978d",[56,63,71,79,84],{"hex":54,"red":57,"green":58,"blue":59,"area":60,"saturation":61,"lightness":62},161,151,141,0.13136455555555557,0.09615384615384609,0.592156862745098,{"hex":64,"red":65,"green":66,"blue":67,"area":68,"saturation":69,"lightness":70},"#d2d1d4",210,209,212,0.000134,0.03370786516853954,0.8254901960784313,{"hex":72,"red":73,"green":74,"blue":75,"area":76,"saturation":77,"lightness":78},"#525153",82,81,83,0.003252888888888889,0.012195121951219556,0.32156862745098036,{"hex":36,"red":80,"green":80,"blue":80,"area":81,"saturation":82,"lightness":83},255,0.03285188888888889,0,1,{"hex":85,"red":86,"green":87,"blue":88,"area":89,"saturation":90,"lightness":91},"#101820",16,24,32,0.8323966666666667,0.3333333333333333,0.09411764705882353,{"meta":93,"episode":101,"transcript":124},{"title":4,"author":5,"description":6,"artwork":7,"categories":94,"feedUrl":10,"type":11,"explicit":12,"link":13,"language":14,"copyright":15,"podcast2":95,"hasPeople":31},[9],{"persons":96,"funding":99},[97,98],{"name":19,"role":20,"img":21,"href":22},{"name":24,"role":20,"img":25,"href":26},[100],{"url":29,"text":30},{"guid":102,"title":103,"slug":104,"description":105,"htmlContent":106,"audioUrl":107,"audioType":108,"audioLength":109,"pubDate":110,"duration":111,"artwork":112,"episodeType":113,"explicit":12,"link":114,"podcast2":115},"changelog.com/16/2796","The \"confident idiot\" problem (News)","the-confident-idiot-problem-news","Why AI needs hard rules (not vibe checks), what Anthropic's acquisition of Bun's creators tells us about the AI takeover, Jonah Glover couldn't get Claude to recreate Space Jam's 1996 website, Google finally unkills something, and Bazzite is a distro for the next generation of Linux gaming.","\u003Cp>Why AI needs hard rules (not vibe checks), what Anthropic’s acquisition of Bun’s creators tells us about the AI takeover, Jonah Glover couldn’t get Claude to recreate Space Jam’s 1996 website, Google finally unkills something, and Bazzite is a distro for the next generation of Linux gaming.\u003C/p>\n\u003Cp>\u003Ca href=\"https://changelog.com/news/173/email\">View the newsletter\u003C/a>\u003C/p>\u003Cp>\u003Ca href=\"https://changelog.zulipchat.com/#narrow/stream/455469-news\">Join the discussion\u003C/a>\u003C/p>\u003Cp>\u003Ca href=\"https://changelog.com/++\" rel=\"payment\">Changelog++\u003C/a> members support our work, get closer to the metal, and make the ads disappear. Join today!\u003C/p>\u003Cp>Sponsors:\u003C/p>\u003Cp>\u003Cul>\u003Cli>\u003Ca href=\"https://depot.dev\">Depot\u003C/a> – \u003Cstrong>10x faster builds? Yes please.\u003C/strong> Build faster. Waste less time. Accelerate Docker image builds, and GitHub Actions workflows. Easily integrate with your existing CI provider and dev workflows to save hours of build time.\n\u003C/li>\n\u003C/ul>\u003C/p>\u003Cp>Featuring:\u003C/p>\u003Cul>\u003Cli>Jerod Santo &ndash; \u003Ca href=\"https://jerodsanto.net\" rel=\"external ugc\">Website\u003C/a>, \u003Ca href=\"https://github.com/jerodsanto\" rel=\"external ugc\">GitHub\u003C/a>, \u003Ca href=\"https://www.linkedin.com/in/jerodsanto\" rel=\"external ugc\">LinkedIn\u003C/a>, \u003Ca href=\"https://changelog.social/@jerod\" rel=\"external ugc\">Mastodon\u003C/a>, \u003Ca href=\"https://x.com/jerodsanto\" rel=\"external ugc\">X\u003C/a>\u003C/li>\u003C/ul>\u003C/p>","https://op3.dev/e/https://pscrb.fm/rss/p/https://cdn.changelog.com/uploads/news/173/changelog-news-173.mp3","audio/mpeg",7653570,"Mon, 08 Dec 2025 20:00:00 +0000",467,"https://cdn.changelog.com/uploads/covers/changelog-news-original.png?v=63848365621","full","https://changelog.com/news/173",{"transcript":116,"chapters":119,"persons":122},{"url":117,"type":118},"https://changelog.com/news/173/transcript","text/html",{"url":120,"type":121},"https://changelog.com/news/173/chapters","application/json+chapters",[123],{"name":24,"role":20,"img":25,"href":26},{"content":125,"type":126,"url":117},"\u003C!DOCTYPE html>\n\u003Chtml>\n\u003Chead>\n  \u003Cmeta charset=\"utf-8\">\n  \u003Cmeta name=\"viewport\" content=\"width=device-width, initial-scale=1\">\n  \u003Cmeta name=\"robots\" content=\"noindex\">\n  \u003Clink rel=\"canonical\" href=\"https://changelog.com/news/173\"/>\n  \u003Ctitle>Transcript for Changelog News #173\u003C/title>\n\u003C/head>\n\u003Cbody>\n\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>What up, nerds? I&#39;m Jerod and this is Changelog News for the week of Monday, December 8th, 2025.\n\nWe&#39;re quickly approaching last call for [state of the &quot;log&quot;](https://changelog.com/topic/sotl) voicemails! We record in a week and have to give BMC time to make the remixes, so if you&#39;re thinking about [sending one](https://changelog.fm/sotl) in (you should), now&#39;s the best time!\n\nSubmit yours today at changelog.fm/sotl\n\nOk, let&#39;s get into this week&#39;s news.\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>[The &quot;confident idiot&quot; problem](https://steerlabs.substack.com/p/confident-idiot-problem)\n\n_Or, &quot;Why AI needs hard rules, not vibe checks&quot;_\n\nIf you&#39;ve been following the *how-do-we-actually-use-ai-in-production* conversation stream, you&#39;ve probably heard people propose a strategy where one LLM checks another LLM&#39;s results. But will that work?\n\n&gt; We are told to ask GPT-4o to grade GPT-3.5. We are told to fix the “vibes.”\n&gt;\n&gt; But this creates a dangerous circular dependency. If the underlying models suffer from sycophancy (agreeing with the user) or hallucination, a Judge model often hallucinates a passing grade.\n&gt;\n&gt; We are trying to fix probability with more probability. That is a losing game.\n\nOne possible way of dealing with these &quot;confident idiots&quot; we&#39;ve introduced into our software stacks the last few years is to &quot;stop treating agents like magic boxes and start treating them like software.&quot; Hence, the [Steer SDK](https://github.com/imtt-dev/steer) was created. \n\n&gt; Steer is an open-source Python library that intercepts agent failures (hallucinations, bad JSON, PII leaks) and allows you to inject fixes via a local dashboard without changing your code.\n\nAnother way of dealing with these &quot;confident idiots&quot; in our software stacks... remove them. If that&#39;s possible...\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>[Bun is joining Anthropic](https://bun.com/blog/bun-joins-anthropic)\n\nThe company behind Bun, which is the open source runtime for Claude Code, is joining Anthropic. We discussed the big acqui(sition|hire) on [last week&#39;s Friends](https://changelog.am/120), but at the time I hadn&#39;t quite considered this move and how contrary it is to Anthropic&#39;s party line that AI agents are replacing software engineers. From Anthropic&#39;s announcement:\n\n&gt; We’ve been a close partner of Bun for many months. Our collaboration has been central to the rapid execution of the Claude Code team, and it directly drove the recent launch of Claude Code’s native installer. We know the Bun team is building from the same vantage point that we do at Anthropic, with a focus on rethinking the developer experience and building innovative, useful products.\n\nBun is open source. Why not just fork it and have a Claude Code powered engineer make all the necessary changes/upgrades to the runtime that Anthropic needs? Because there&#39;s no getting there from here. At least not yet. Jarred Sumner and the Bun team&#39;s *expertise* is what&#39;s so valuable. Even to Anthropic.\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>[Claude can&#39;t recreate classic Space Jam site](https://j0nah.com/i-failed-to-recreate-the-1996-space-jam-website-with-claude)\n\nJonah Glover tried to recreate everyone&#39;s favorite [1996 website](https://www.spacejam.com/1996/) by giving Claude Code (running Opus 4.1) a screenshot of the site and all the associated assets. It failed (repeatedly) in all the ways I would expect from my own frontend / design attempts with the tool. Jonah&#39;s finding, which is quite relatable:\n\n&gt; Once Claude&#39;s version existed, every grid overlay, every comparison step, every &quot;precise&quot; adjustment was anchored to his layout, not the real one. At the end of all this, I&#39;m left with the irritating fact that, like many engineers, he&#39;s wrong and he thinks he&#39;s right.\n&gt;\n&gt; What this teaches me is that Claude is actually kind of a liar, or at least Claude is confused. However, for the drama, I&#39;ll assume Claude is a liar.\n\nI&#39;ve been giving Claude Code a lot of props lately, but I&#39;ve also been giving it a lot of tasks it just can&#39;t quite accomplish. This process starts off as fun and interesting, but each time it ends in failure I am perplexed by all the possible failure paths. Was it me and my prompting? Was it the agent? Was it the model? Or perhaps I&#39;m asking for things that aren&#39;t easily accomplished with today&#39;s tech? (I can be quite demanding.)\n\nThis makes me yearn for the days when the only one to blame for my failures was me...\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>It&#39;s now time for sponsored news!\n\n[Depot&#39;s Advent of Code 2025](https://depot.dev/events/advent-of-code-2025)\n\nDepot is running a community leaderboard for Advent of Code 2025 and they&#39;re **putting real money behind it**.\n\nThe top five finishers each direct $1,000 to a registered charity of their choice. If you pick a charity supporting STEM education or the developer ecosystem, Depot adds a 50% bonus. They&#39;ve already generated $7,500 in donations.\n\nThe format: 12 days of puzzles, unlocking daily at midnight EST starting December 1st. Solve at your own pace. There&#39;s no time limit. Any language, any skill level. Each day brings a two-part programming challenge from Eric Wastl&#39;s Advent of Code.\n\nTo join Depot&#39;s private leaderboard, request access on their events page. They&#39;ll send you a code. Whether you&#39;re competing for the top 5 or just want to sharpen your skills alongside other devs, it&#39;s a good excuse to write some code this month.\n\nCheck it out at [depot.dev/events/advent-of-code-2025](https://depot.dev/events/advent-of-code-2025) or just follow the link in the newsletter and your chapter data\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>[Google *unkills* JPEG XL?](https://tonisagrista.com/blog/2025/google-unkills-jpegxl/)\n\n&gt; In a dramatic turn of events, the Chromium team has reversed its &quot;Obsolete&quot; tag, and has decided to support the format in Blink (the engine behind Chrome/Chromium/Edge). Given Chrome’s position in the browser market share, I predict the format will become a de factor standard for images in the near future.\n\nWe&#39;re used to things being [killed by Google](https://killedbygoogle.com)... but *unkilled*?! This is a trend I can get behind. Unkill requests! \n\nIt&#39;s time to bring back [Zeitgeist](https://web.archive.org/web/20210312230138/https://www.lifewire.com/google-zeitgeist-3481903), [Dodgeball](https://en.wikipedia.org/wiki/Dodgeball_(service)), and [Google Reader](https://en.wikipedia.org/wiki/Google_Reader)...\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>[The next generation of Linux gaming](https://bazzite.gg/)\n\nIf the mythical &quot;Year of the Linux Desktop&quot; is ever to materialize, it will first be preceded by a sea change in gaming options for the venerable open source OS. The gaming sea change appears to be in full swing, with Steam on Linux hitting an all-time high over 3% usage [last month](https://www.phoronix.com/news/Steam-Linux-November-2025).\n\nEnter Bazzite, a Fedora-based Linux distro that&#39;s hyper-focused on making gaming awesome:\n\n&gt; Bazzite is designed for Linux newcomers and enthusiasts alike with Steam pre-installed, HDR &amp; VRR support, improved CPU schedulers for responsive gameplay, and numerous community-developed tools and tweaks to streamline your gaming and streaming experience.\n\nThe project began back in 2023, but it appears to be maturing and aiming at sustainability by setting up ways to donate with its [latest update](https://universal-blue.discourse.group/t/bazzite-fall-update-fedora-43-xbox-allies-legion-go-2-nvidia-gtx/10948):\n\n&gt; As Bazzite matures, we begin to tackle more ambitious projects, such as proper secure boot, support for more handheld devices, and conference attendance, which means more costs for us. And we would gladly appreciate the help in covering them!\u003C/p>\n\n\n    \u003Ccite>Break:\u003C/cite>\n    \u003Cp>\u003C/p>\n\n\n    \u003Ccite>Jerod Santo:\u003C/cite>\n    \u003Cp>That&#39;s the news for now, but go and subscribe to the Changelog Newsletter for the full scoop of links worth clicking on. Such as:\n\n- [Why I ignore the spotlight as a staff engineer](https://lalitm.com/software-engineering-outside-the-spotlight/)\n- [Vanilla CSS is all you need](https://www.zolkos.com/2025/12/03/vanilla-css-is-all-you-need)\n- [What happens when you take an XKCD joke too literally](https://stacktower.io)\n\nGet in on the newsletter at changelog.news\n\nHave a great week! Like, subscribe, and leave us a 5-star review if you dig the show, and I&#39;ll talk to you again real soon.\u003C/p>\n\n\u003C/body>\n\u003C/html>\n","text/html; charset=utf-8",1771793543563]