<?xml version="1.0" encoding="UTF-8"?><rss xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:atom="http://www.w3.org/2005/Atom" version="2.0" xmlns:itunes="http://www.itunes.com/dtds/podcast-1.0.dtd" xmlns:googleplay="http://www.google.com/schemas/play-podcasts/1.0"><channel><title><![CDATA[BoxCars AI]]></title><description><![CDATA[AI. Strategy. Insights.]]></description><link>https://blog.boxcars.ai</link><image><url>https://substackcdn.com/image/fetch/$s_!lhIv!,w_256,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png</url><title>BoxCars AI</title><link>https://blog.boxcars.ai</link></image><generator>Substack</generator><lastBuildDate>Fri, 10 Apr 2026 12:00:05 GMT</lastBuildDate><atom:link href="https://blog.boxcars.ai/feed" rel="self" type="application/rss+xml"/><copyright><![CDATA[BoxCars AI]]></copyright><language><![CDATA[en]]></language><webMaster><![CDATA[boxcarsai@substack.com]]></webMaster><itunes:owner><itunes:email><![CDATA[boxcarsai@substack.com]]></itunes:email><itunes:name><![CDATA[Tabrez Syed]]></itunes:name></itunes:owner><itunes:author><![CDATA[Tabrez Syed]]></itunes:author><googleplay:owner><![CDATA[boxcarsai@substack.com]]></googleplay:owner><googleplay:email><![CDATA[boxcarsai@substack.com]]></googleplay:email><googleplay:author><![CDATA[Tabrez Syed]]></googleplay:author><itunes:block><![CDATA[Yes]]></itunes:block><item><title><![CDATA[From Second Brain to Shared Brain]]></title><description><![CDATA[The hottest idea in AI this week is something a German sociologist figured out with index cards in 1953.]]></description><link>https://blog.boxcars.ai/p/from-second-brain-to-shared-brain</link><guid isPermaLink="false">https://blog.boxcars.ai/p/from-second-brain-to-shared-brain</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 09 Apr 2026 13:03:09 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="6000" height="4000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:4000,&quot;width&quot;:6000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Wall of vintage wooden filing cabinet drawers&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Wall of vintage wooden filing cabinet drawers" title="Wall of vintage wooden filing cabinet drawers" srcset="https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1770869731843-bd36aa92403c?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZmlsaW5nJTIwY2FiaW5ldHxlbnwwfHx8fDE3NzU2NzIxMzV8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@worldtravelwithjean">J&#233;an B&#233;ller</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><div><hr></div><p>Andrej Karpathy published <a href="https://gist.github.com/karpathy/442a6bf555914893e9891c11519de94f">a gist last week</a> describing a pattern he calls &#8220;LLM Wiki.&#8221; The idea: an LLM that builds and maintains a personal knowledge base &#8212; interlinked markdown files, structured summaries, cross-references updated automatically. You curate the sources and ask the questions. The LLM does the bookkeeping. Five thousand stars in four days.</p><p>His key analogy: &#8220;<a href="https://www.mandalivia.com/obsidian/">Obsidian</a> is the IDE; the LLM is the programmer; the wiki is the codebase.&#8221;</p><p>It&#8217;s a sharp proposal. It&#8217;s also one that a German sociologist named <a href="https://en.wikipedia.org/wiki/Niklas_Luhmann">Niklas Luhmann</a> would have recognized immediately &#8212; from the system of 90,000 handwritten index cards he maintained for forty-five years, starting in 1953. Luhmann&#8217;s <a href="https://en.wikipedia.org/wiki/Zettelkasten">Zettelkasten</a> is similar to what Karpathy describes: interlinked notes, cross-references, a persistent structure where knowledge compounds over time. He produced seventy books from it. The architecture wasn&#8217;t the hard part. The filing was.</p><p>Between Luhmann and Karpathy, an entire community spent decades working on this problem &#8212; <a href="https://en.wikipedia.org/wiki/As_We_May_Think">Vannevar Bush&#8217;s Memex</a> in 1945, the tools-for-thought movement, Roam Research and Obsidian, Tiago Forte&#8217;s <em><a href="https://www.buildingasecondbrain.com/">Building a Second Brain</a></em> in 2022. Karpathy walked into a room that&#8217;s been full for decades. But he brought something new through the door.</p><h2>What he got right</h2><p>The thing that kills every personal knowledge system isn&#8217;t the architecture &#8212; it&#8217;s the upkeep. Updating cross-references when your thinking evolves, keeping summaries current, noticing when something you wrote six months ago now contradicts what you learned last week. Most people who start a second brain quit within months. The bookkeeping grows faster than the value, and one day you stop opening the app.</p><p>Karpathy&#8217;s solution &#8212; hand the maintenance to an LLM &#8212; is pragmatic. If you were never going to build the habit yourself, having an agent build a compounding knowledge base for you is vastly better than having nothing at all.</p><p>But his framing reveals an assumption: &#8220;You never write the wiki yourself.&#8221; The human curates sources and asks questions. The LLM writes, files, and maintains. You read it; the LLM writes it.</p><p>For people starting from zero, that division makes sense. But there&#8217;s another group &#8212; people who already built the habit, who already have a second brain they&#8217;ve been writing in for years. For them, the opportunity looks different.</p><h2>The shared surface</h2><p>I&#8217;ve kept a second brain in Obsidian for nearly five years &#8212; around 2,400 notes, wikilinked together, semantically searchable. I started building it before AI entered the picture, for the same reason people have always built these systems: I wanted to externalize my thinking so I could work with it.</p><p>When I read Karpathy&#8217;s proposal, I recognized the architecture immediately &#8212; but from the other direction. He was asking how to give an agent persistent memory. I&#8217;d already answered that question by accident, by handing the agent the memory system I&#8217;d built for myself.</p><p>The move wasn&#8217;t &#8220;LLM builds a wiki.&#8221; It was &#8220;come work where I already work.&#8221;</p><p>Karpathy&#8217;s framing is that you read the wiki and the LLM writes it. In my vault, we both write to it. The agent logs entries to my notes, and I read them the next morning. I update a project file with notes from a call, and the agent picks up the new context in its next session without my having to explain anything. When a family member emails an update about a medical appointment, the agent processes it into my file in the vault &#8212; the same file I open when I&#8217;m at the next appointment.</p><p>The project file carries the chronology &#8212; who did what, when, what&#8217;s next &#8212; and both of us contribute to it. Neither of us has to re-explain context over chat because the context lives in the notes we&#8217;re both already using.</p><p>This only works because the vault is my actual workspace, not a reference library I consult occasionally. If the agent wrote to a separate folder I never opened &#8212; the way most AI memory systems work &#8212; I&#8217;d never see what it got wrong, never catch a stale fact or a misunderstood priority. The errors would compile quietly into the agent&#8217;s model of my life, looking authoritative. A shared brain only stays honest when both parties are working in it.</p><h2>What changes</h2><p>A wiki the LLM maintains for you is an archive &#8212; historical and well-organized. But it&#8217;s the LLM&#8217;s understanding of your world, written in the LLM&#8217;s voice, looking backward. You visit it when you have a question about what happened.</p><p>A vault you both work in is a whiteboard. I start my morning and the agent already knows what I was working on yesterday, what&#8217;s blocked, what changed overnight &#8212; not because I briefed it, but because it was there. I don&#8217;t re-explain context. I don&#8217;t paste in background. I pick up a thread and the agent picks up the other end &#8212; like a teammate who was in the room yesterday and will be in the room tomorrow.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>I write about what happens when AI stops being a tool and starts being a collaborator. If that&#8217;s a question you&#8217;re thinking about too, subscribe.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[I Made This]]></title><description><![CDATA[When creative barriers drop, a rush follows. What happens after is the interesting part.]]></description><link>https://blog.boxcars.ai/p/i-made-this</link><guid isPermaLink="false">https://blog.boxcars.ai/p/i-made-this</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 02 Apr 2026 13:00:57 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4703" height="3134" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3134,&quot;width&quot;:4703,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;Two t-shirts, black and light green, with cotton stems.&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="Two t-shirts, black and light green, with cotton stems." title="Two t-shirts, black and light green, with cotton stems." srcset="https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1759572095317-3a96f9a98e2b?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHx0LXNoaXJ0JTIwZGVzaWdufGVufDB8fHx8MTc3NTAyNzM3Mnww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@tonnnyj">tian dayong</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p></p><p>There was a website in the early 2000s called <a href="https://www.threadless.com/">Threadless</a> where anyone could submit a t-shirt design. The community voted, and the winners got printed. That was the whole thing.</p><p>But the feeling was something else. You had an idea on Tuesday and strangers were wearing it by next month. Glenn Jones, a graphic designer from New Zealand, won 21 times and eventually quit his fifteen-year career as a creative director to sell his own designs. &#8220;I didn&#8217;t want to be left wondering,&#8221; he said. The prize money wasn&#8217;t the point. Seeing his design on a shirt someone across the world had chosen to wear was.</p><p>The barrier between &#8220;I have an idea&#8221; and &#8220;I made a thing&#8221; had collapsed, and people poured through.</p><p>When Apple started shipping <a href="https://www.apple.com/garageband/">GarageBand</a> on every new Mac in 2004, the same thing happened to music. Anyone who wanted to could lay down a beat and mix a track without booking studio time. Most people who opened it made one song, played it for a friend, and never opened it again. Nobody cared. The point was the jolt of <em>I can do this</em>.</p><p>Grimes, a university student in Montreal, got a friend to show her the software and started making what she later called &#8220;<a href="https://www.npr.org/2016/04/27/455769676/feeling-this-a-conversation-with-grimes">terrible, terrible songs</a>&#8220; using the built-in synths. She kept going. A couple years later she recorded <em><a href="https://en.wikipedia.org/wiki/Visions_(Grimes_album)">Visions</a></em> in her apartment over three weeks, still on GarageBand, and won a Juno Award. Then she was headlining festivals.</p><p>Steve Lacy was <a href="https://www.musicradar.com/news/steve-lacy-garageband-iphone">17 and still in high school in Compton</a> when he plugged a guitar into his iPhone and started recording parts for The Internet&#8217;s <em>Ego Death</em> on the GarageBand app. The album got a <a href="https://en.wikipedia.org/wiki/Ego_Death_(album)">Grammy nomination</a>, and Lacy kept recording on that phone long enough for his single &#8220;<a href="https://en.wikipedia.org/wiki/Bad_Habit_(Steve_Lacy_song)">Bad Habit</a>&#8220; to hit number one on the Billboard Hot 100 a few years later.</p><p>AI coding tools are in this phase right now. Every week my feed fills with screenshots of apps someone built in an afternoon &#8212; a habit tracker, a recipe tool, a game their kid wanted. I&#8217;ve been building them myself. Not because I need another app, but because I can, and that feeling hasn&#8217;t gotten old yet. &#8220;I made this.&#8221; Same jolt. Different canvas.</p><h2>The fork</h2><p>Here&#8217;s the pattern after the rush. Millions of people felt that jolt of possibility when they first opened GarageBand, and most of them never opened it again. That&#8217;s not failure, and it&#8217;s not a waste. But for most people the rush was about the novelty of the tool, not the beginning of a new identity.</p><p>For some people, though, the rush turns out to be a discovery. Grimes and Lacy didn&#8217;t know they were musicians until the barrier dropped and they walked through it. The tool didn&#8217;t give them talent. It gave them a way to discover their art. What separated them from the millions who moved on wasn&#8217;t discipline or seriousness. It was recognition, a feeling that this new thing they could suddenly do was somehow already theirs.</p><h2>The on-ramp</h2><p>Most of the apps people are building right now will stop working when the dependencies break. That&#8217;s fine. The rush was never really about the app. But somewhere in that flood, someone is finding out they&#8217;re a builder &#8212; month one of something nobody sees coming.</p><p>The Threadless shirt is in the back of the closet. The GarageBand track never got a second listen. And Steve Lacy&#8217;s cracked iPhone &#8212; the one he used to record on GarageBand as a teenager &#8212; is <a href="https://hypebeast.com/2022/12/steve-lacy-2012-iphone-smithsonian-entertainment-nation-exhibit">on display at the Smithsonian</a>. Not every GarageBand project ends up in a museum. But you can&#8217;t get to the museum without the project.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>I made this article with Claude. If you&#8217;re curious about what human-AI   collaboration actually looks like as it evolves, subscribe &#8212; I write about it  weekly.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[The Promotion I Missed]]></title><description><![CDATA[What managing a new hire taught me about working with AI]]></description><link>https://blog.boxcars.ai/p/the-promotion-i-missed</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-promotion-i-missed</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 26 Mar 2026 13:03:22 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="5184" height="3456" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3456,&quot;width&quot;:5184,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;person using laptop&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="person using laptop" title="person using laptop" srcset="https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1516321318423-f06f85e504b3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxpbnRlcm58ZW58MHx8fHwxNzc0NTAwMjc4fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@johnishappysometimes">John</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><div><hr></div><p>I was writing a skill file for Claude Code when a line in Anthropic&#8217;s documentation stopped me. It said to explain <em>why</em> the skill was needed &#8212; not just what it should do, but why it existed in the first place.</p><p>I&#8217;d been writing prompts as step-by-step procedures &#8212; edge cases spelled out, fallback behaviors for when things went wrong. The kind of detail you give someone when you don&#8217;t trust them to figure it out on their own.</p><p>But here was the documentation saying: just tell it why.</p><p>I knew this moment. I&#8217;d been on the other side of it before &#8212; not with software.</p><h2>Kate</h2><p>I hired Kate (not her real name) straight out of college. Computer science degree, disciplined, the kind of work ethic where you&#8217;d assign something Friday afternoon and find it done by Monday morning. But she needed the task spelled out &#8212; not because she wasn&#8217;t smart, but because she was new. No different than I had been at her age. So I gave her detailed specs, walked through edge cases, flagged where things could go wrong. She executed well within those boundaries, and the boundaries were tight.</p><p>Anyone who&#8217;s managed people knows what happened next. The instructions loosened. Her questions changed &#8212; not &#8220;how should I do this?&#8221; but &#8220;are we solving the right problem?&#8221; The projects changed too: early on it was &#8220;implement this feature, here are the requirements,&#8221; and later it was &#8220;this part of the system isn&#8217;t working for users &#8212; figure out why.&#8221;</p><p>At some point my 1:1s with Kate stopped being about what to do and started being about why we were doing it. Context, priorities, the business problem behind the technical one. I was managing her the way my best managers had managed me &#8212; with intent, not instruction.</p><p>And then Kate started managing others. She onboarded new hires with the same careful detail I&#8217;d once given her &#8212; spelling out the specs, walking through edge cases, flagging where things could go wrong. The promotion, when it came, was a formality. She&#8217;d been operating at that level for months. We just hadn&#8217;t updated the title yet.</p><h2>Claude</h2><p>I started working with Claude early on, back when the model couldn&#8217;t stay focused for long. Its context window was small and it would lose the thread of a conversation halfway through. So I learned to spell things out. I&#8217;d provide examples of the output I wanted so it could mimic the pattern. I&#8217;d write &#8220;let&#8217;s think step by step&#8221; because it couldn&#8217;t reason unless you told it to. I&#8217;d open with &#8220;act as a senior software engineer&#8221; to narrow the field of possible responses. The boundaries were tight &#8212; just like they&#8217;d been with Kate. And like Kate, it executed well within them.</p><p>Anyone who&#8217;s been using these tools knows what happened next. The instructions loosened. &#8220;Let&#8217;s think step by step&#8221; &#8212; the technique that defined an era of prompting, the thing people <a href="https://fortune.com/2025/05/07/prompt-engineering-200k-six-figure-role-now-obsolete-thanks-to-ai/">paid $335,000 a year</a> to get right &#8212; now <a href="https://gail.wharton.upenn.edu/research-and-insights/tech-report-chain-of-thought/">barely improves performance</a>; on some models it actually hurts. The model internalized the technique the way Kate internalized project management. It just does it now, without being told. My prompts changed the way Kate&#8217;s questions had changed &#8212; less &#8220;here&#8217;s exactly what to do&#8221; and more &#8220;here&#8217;s what&#8217;s going wrong and why it matters.&#8221;</p><p>And then Claude started managing others. I used to open multiple sessions myself &#8212; one for writing, one for review, one for research. Now Claude spins up subagents on its own, delegating work with care.</p><h2>The Recognition</h2><p>Since December, I find myself in new territory with the models. The latest step up feels like a promotion, but like with Kate, it&#8217;s taking some reorientation.</p><p>With Kate, the hard part wasn&#8217;t her readiness &#8212; it was mine. I kept handing her detailed specs after she&#8217;d outgrown them, still seeing the new hire I&#8217;d onboarded instead of the senior engineer she&#8217;d become. The unlock wasn&#8217;t just her leveling up. It was me noticing that she had.</p><p>I went back to my skill file. This time, instead of spelling out procedures and edge cases, I found myself doing what every good manager eventually learns to do: starting with the why. What problem I was trying to solve. What good looked like. The kind of context you give someone when you trust them to figure out the how.</p><p>Ethan Mollick <a href="https://www.oneusefulthing.org/p/on-boarding-your-ai-intern">wrote in 2023</a> that we should treat AI like an intern. It was good advice at the time. But interns don&#8217;t stay interns.</p><p>Kate went on to become a director. She&#8217;s worked at companies I&#8217;ve only read about, led teams bigger than any I&#8217;ve built. If I&#8217;m being honest, I could see myself working for her.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>If you enjoyed this, subscribe for weekly essays on working alongside AI as it grows up. </em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[The Poorly Lit Factory]]></title><description><![CDATA[What a tent in a Tesla parking lot tells us about the future of AI-generated code]]></description><link>https://blog.boxcars.ai/p/the-poorly-lit-factory</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-poorly-lit-factory</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 19 Mar 2026 13:04:19 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="6000" height="4000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:4000,&quot;width&quot;:6000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;gray vehicle being fixed inside factory using robot machines&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="gray vehicle being fixed inside factory using robot machines" title="gray vehicle being fixed inside factory using robot machines" srcset="https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1567789884554-0b844b597180?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyfHxyb2JvdCUyMGZhY3Rvcnl8ZW58MHx8fHwxNzczOTA4NTAyfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@lennykuhne">Lenny Kuhne</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>At the foot of Mount Fuji, robots build other robots in total darkness. No lights &#8212; the machines don&#8217;t need to see. No heating, no air conditioning either. &#8220;Not only is it lights-out,&#8221; a <a href="https://www.bloomberg.com/news/features/2017-10-18/this-company-s-robots-are-making-everything-and-reshaping-the-world">FANUC</a> executive once explained, &#8220;we turn off the air conditioning and heat too.&#8221; The yellow arms move with precision through pitch black, producing roughly fifty new robots every twenty-four hours, sometimes running unsupervised for weeks at a stretch.</p><p>The industry calls this a &#8220;dark factory&#8221; &#8212; not metaphorically. It&#8217;s literally dark because humans aren&#8217;t there, and robots don&#8217;t care.</p><p>In January 2026, entrepreneur Dan Shapiro <a href="https://www.danshapiro.com/blog/2026/01/the-five-levels-from-spicy-autocomplete-to-the-software-factory/">published a framework</a> mapping AI-assisted software development onto five levels &#8212; borrowing the concept directly from FANUC&#8217;s lightless factory floor. At one end, AI is &#8220;spicy autocomplete.&#8221; At the other, it&#8217;s a dark factory: specs go in, working software comes out, no human writes or reviews a line of code.</p><p>At least one team claims to already be there.</p><h2>Level Five</h2><p>What does a dark factory look like when the factory floor is an IDE?</p><p>Right now, most teams using AI to write software still keep the lights on. A developer prompts an AI to generate a function, reads what comes back, adjusts the prompt, tries again. Or an AI agent writes a pull request and a human reviews it &#8212; scanning the diff, checking the logic, clicking approve. The AI does the typing, but a human is always in the room, either steering or inspecting. In Shapiro&#8217;s framework, this is Level 2 or 3. The lights are dimmed, maybe, but someone is always watching.</p><p>Last July, StrongDM&#8217;s CTO Justin McCarthy formed a three-person team and turned the lights off. Their charter had two rules. The first: code must not be written by humans. The second: code must not be reviewed by humans. Not &#8220;humans can review if they want to.&#8221; Must not. The rules aren&#8217;t constraints born from laziness &#8212; they&#8217;re a forcing function. If no human is allowed to touch the code, you have to solve every quality problem some other way.</p><p>By the time Simon Willison <a href="https://simonwillison.net/2026/Feb/7/software-factory/">visited their lab</a> in October, three people had produced thirty-two thousand lines of production software without a single line written or reviewed by a human hand. Willison watched a demo where a developer had a complex application running on localhost &#8212; something that looked like Google Sheets but with real backend logic, a working frontend, actual functionality. The entire thing had been produced by AI agents operating against human-defined specifications. Willison called it <a href="https://simonwillison.net/2026/Feb/7/software-factory/">&#8220;the most ambitious form of AI-assisted software development I&#8217;ve seen yet.&#8221;</a></p><p>But the ambition raises an obvious question. If no human writes the code and no human reviews it, how do you know it works?</p><h2>All Models Are Wrong</h2><p>McCarthy&#8217;s team answered that question by building a world.</p><p>Their software talks to Slack, Jira, Okta, Google Docs in production &#8212; so they built replicas of all of them. Not mocks that return canned responses, but stateful behavioral clones. Delete a Slack channel in the replica, and it stays deleted; the next time your code tries to post there, it gets the same &#8220;channel not found&#8221; error it would get from the real thing. Change a user&#8217;s role in the Okta replica, and five minutes later the Jira replica blocks their access, just like the real services would.</p><p>The AI agents write code, deploy it into this digital universe, and see what happens. They run thousands of scenarios &#8212; end-to-end user stories that the team keeps hidden from the coding agents, like holdout sets in machine learning. The agents don&#8217;t know what the tests are. They have to bumble through the simulated world, interact with the replicas, and iterate until the software actually works against conditions it wasn&#8217;t specifically told to expect. When something breaks, the agents adjust and try again. The feedback comes from the universe itself.</p><p>Willison saw why this mattered. Building a high-fidelity clone of a complex SaaS application, he <a href="https://simonwillison.net/2026/Feb/7/software-factory/">wrote</a>, &#8220;was always possible, but never economically feasible&#8221; &#8212; until LLMs made it cheap enough to build at scale. But strip away the branding and what McCarthy&#8217;s team has built is integration testing. Thorough, high-fidelity, running at a scale that wasn&#8217;t economical before &#8212; but integration testing all the same.</p><p>And integration testing has a problem that no amount of scale solves. The tests are only as good as the model they run against. The statistician George Box put it simply in 1987: &#8220;All models are wrong, but some are useful.&#8221; McCarthy&#8217;s digital universe is a model &#8212; a good one, good enough to ship thirty-two thousand lines of production code on. But the map is not the territory. When the real Slack changes how it handles rate limits, or Okta tweaks an authentication flow, the model doesn&#8217;t know until something updates it. And in that gap between the model and reality, the dark factory is running full speed, producing code that works perfectly in a world that no longer quite exists.</p><p>The dream of full automation has crashed into the gap between model and reality before &#8212; and the most famous case left a billionaire building cars by hand in a tent.</p><h2>The Tent</h2><p>In 2016, Elon Musk described his vision for the Tesla Model 3 production line as &#8220;the machine that builds the machine.&#8221; The internal codename was the Alien Dreadnought &#8212; a factory so automated it would look inhuman. Robots would handle everything. The line would move so fast that air resistance on the parts would become a design constraint. Humans would only slow it down.</p><p>By 2018, the Alien Dreadnought was in ruins. Musk had automated tasks that didn&#8217;t need automating &#8212; complex conveyor systems for jobs a person could do in seconds, robotic arms trying to handle parts that varied just enough to jam the line. The Model 3 was supposed to roll off the line at five thousand cars a week. It was producing a fraction of that, and the company was <a href="https://www.cnbc.com/2019/07/15/tesla-workers-in-ga4-tent-describe-pressure-to-make-model-3-goals.html">burning through cash</a> at an unsustainable rate.</p><p>So Musk did something that would have been unthinkable two years earlier. In three weeks, his team erected a massive temporary structure &#8212; a tent, officially called GA4 &#8212; in the Fremont factory parking lot. Inside, humans assembled cars by hand. Not robots. People, working around the clock, doing the thing the perfect automated factory couldn&#8217;t do.</p><p>&#8220;Yes, excessive automation at Tesla was a mistake,&#8221; Musk <a href="https://techcrunch.com/2018/04/13/elon-musk-says-humans-are-underrated-calls-teslas-excessive-automation-a-mistake/">tweeted</a> on April 13, 2018. &#8220;To be precise, my mistake. Humans are underrated.&#8221;</p><p>It&#8217;s the kind of story that gets told as a cautionary tale &#8212; the hubris of full automation, the return of the human. But that&#8217;s not where the story ends. Tesla didn&#8217;t abandon the dream. They rebuilt the line incrementally, automating where it made sense, keeping humans where it didn&#8217;t. The Fremont factory today produces roughly half a million vehicles a year, far more automated than the tent but far less than the Alien Dreadnought imagined. Musk didn&#8217;t skip to lights-out in one leap. He got there &#8212; or closer to there &#8212; by working his way along the curve.</p><p>The tent was a point on the curve.</p><h2>The Poorly Lit Factory</h2><p>Everybody&#8217;s building toward the dark factory now. Cursor says <a href="https://cursor.com/blog/scaling-agents">thirty-five percent</a> of its own merged pull requests come from autonomous agents; Cognition claims their AI developer Devin merges <a href="https://cognition.ai/blog/devin-annual-performance-review-2025">sixty-seven percent</a> of its PRs. But companies selling AI tools have an interest in claiming the factory is going dark &#8212; and independent testing puts Devin&#8217;s success rate on open-ended tasks closer to fifteen percent. That gap between vendor stats and outside measurement tells you something about where we actually are. Then again, companies with no AI product to sell are seeing real results too: Stripe&#8217;s internal system <a href="https://stripe.dev/blog/minions-stripes-one-shot-end-to-end-coding-agents">produces over a thousand agent-written PRs a week</a> &#8212; though every one of them is still reviewed by a human before it merges.</p><p>Nobody&#8217;s fully dark yet. Most teams are somewhere between Shapiro&#8217;s Level 2 and Level 4 &#8212; the lights dimmed but not off, humans still in the loop at some point in the chain. McCarthy&#8217;s team at StrongDM may be the furthest along, and even they depend on a model of the world that&#8217;s only as current as its last update.</p><p>Maybe that&#8217;s fine. Maybe the dark factory was always an asymptote &#8212; a limit we approach but never quite reach. FANUC still has humans maintaining the lines at Mount Fuji. Tesla rebuilt toward automation incrementally after the tent, and Fremont today is neither the Alien Dreadnought nor the parking lot.</p><p>The thing that matters is a factory that works. A dark factory that fails when the parts come in slightly different than the simulation predicted isn&#8217;t useful &#8212; no matter how impressive the automation looks in a demo. And if keeping a few lights on is what makes it run, then a poorly lit factory is the better factory.</p><p>There will always be people trying to turn that last light off. That&#8217;s fine &#8212; that&#8217;s how the asymptote moves. But the work worth watching is what&#8217;s getting built while the lights are still on.</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>The lights are dimming across the software industry. Subscribe to watch what stays lit</em>.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[The Dream of the Serpent]]></title><description><![CDATA[AI solved an open math problem and outperformed a world-class engineer. The process looked a lot like genius.]]></description><link>https://blog.boxcars.ai/p/the-dream-of-the-serpent</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-dream-of-the-serpent</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 12 Mar 2026 13:02:51 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!7j9c!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!7j9c!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!7j9c!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 424w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 848w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!7j9c!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png" width="1456" height="971" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/f17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:971,&quot;width&quot;:1456,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:2754766,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/190652401?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!7j9c!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 424w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 848w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!7j9c!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ff17a5554-b891-4291-b903-7f32a18261d8_1536x1024.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>In 1865, the German chemist August Kekul&#233; was stuck. He&#8217;d spent years trying to work out the structure of benzene &#8212; a molecule that chemists knew the ingredients of but couldn&#8217;t figure out the shape. Carbon and hydrogen atoms in the right quantities, but no arrangement anyone proposed could explain how they held together. Kekul&#233; had been turning the problem over for so long it followed him into his sleep.</p><p>As the story goes, one evening he dozed off by the fire and dreamed of atoms dancing and twisting into chains. Then one of the chains curled around and seized its own tail &#8212; a serpent forming a ring. He woke up and spent the rest of the night working out the implications. Benzene wasn&#8217;t a chain. It was a ring. The ouroboros &#8212; the ancient image of a serpent eating itself &#8212; had revealed one of the foundational structures of organic chemistry.</p><p>It&#8217;s a great story, and it&#8217;s the kind of story we love to tell about problem-solving &#8212; the answer arrives in a flash, delivered by the subconscious as a gift, genius as something that happens <em>to</em> you rather than something you grind out. We conveniently forget that Kekul&#233; had been grinding for years before the dream arrived.</p><p>The common criticism of AI follows a similar logic. AI is just autocomplete &#8212; it can remix what it&#8217;s seen, predict the next likely word, maybe even sound convincing, but it can&#8217;t <em>solve</em> anything new. It doesn&#8217;t have insight. It can&#8217;t have that Kekul&#233; moment where the pieces suddenly fall into place. It&#8217;s a pattern-matching engine, not a mind that can discover.</p><p>It&#8217;s a reasonable position. But last week, two things happened that made me wonder whether we&#8217;ve been too sure about what &#8220;discovery&#8221; requires.</p><h2>The Mathematician</h2><p><a href="https://en.wikipedia.org/wiki/Donald_Knuth">Donald Knuth</a> is not the kind of person who gets excited about AI. A Turing Award winner and the author of <em>The Art of Computer Programming</em> &#8212; the textbook I used in my own computer science program in college, and still the definitive reference in the field &#8212; Knuth is often called the father of algorithm analysis. He has been openly skeptical about the productivity of large language models.</p><p>So when Knuth <a href="https://cs.stanford.edu/~knuth/papers/claude-cycles.pdf">published a note</a> on Stanford&#8217;s website last week, what he described sounded almost like a Kekul&#233; moment &#8212; for a machine.</p><p>Knuth had been stuck for weeks on an open problem from his textbook: finding paths through a three-dimensional grid of points where each path visits every point exactly once, returns to its start, and shares no connections with the other paths. He&#8217;d solved it for small grids but couldn&#8217;t crack the general case. His friend fed the problem to <a href="https://www.anthropic.com/">Claude</a>, Anthropic&#8217;s AI model, and what came back wasn&#8217;t brute force. Claude recognized that the grid had a deeper mathematical structure &#8212; a kind of symmetry that Knuth&#8217;s original framing hadn&#8217;t exploited. It invented a way to decompose the grid into layers, then built serpentine patterns that wove through each layer in a way that satisfied all the constraints simultaneously. It reframed the problem, then solved the reframed version.</p><p>Knuth verified the mathematics himself and called the approach &#8220;remarkably creative.&#8221; Not just correct &#8212; creative. &#8220;It seems that I&#8217;ll have to revise my opinions about &#8216;generative AI&#8217; one of these days,&#8221; he wrote.</p><p>Now here&#8217;s the thing: Claude didn&#8217;t arrive at that solution in a flash. It worked through the problem over about an hour, trying different approaches, hitting dead ends, adjusting its framing each time. The structural insight that cracked the problem &#8212; the decomposition into layers, the serpentine patterns &#8212; emerged from that process of trying and revising. Not randomly, but not in a single leap either. More like a mind circling a problem, getting closer with each pass, until the right angle of approach comes into focus.</p><p>Which sounds a lot like what Kekul&#233;&#8217;s subconscious was probably doing while he slept &#8212; running variations on carbon structures, testing arrangements against what he knew about molecular bonding, until one arrangement clicked and surfaced as a dream about a serpent.</p><h2>The Engineer</h2><p>The same week, <a href="https://en.wikipedia.org/wiki/Andrej_Karpathy">Andrej Karpathy</a> &#8212; a founding member of OpenAI and former head of AI at Tesla &#8212; ran a different experiment.</p><p>Karpathy maintains <a href="https://github.com/karpathy/nanochat">nanochat</a>, an open-source project for training small language models from scratch. Think of it as a workbench for building AI &#8212; minimal, transparent, designed for tinkering. He&#8217;d spent months hand-tuning the system&#8217;s internal settings to squeeze out better performance, and he thought the project was well-optimized.</p><p>Then he gave an AI agent his code with a simple instruction &#8212; make it better &#8212; and left it running for two days.</p><p>What came back wasn&#8217;t just a list of minor tweaks. The agent noticed that a key part of the model&#8217;s attention mechanism was missing a component, making it too diffuse &#8212; a subtle architectural oversight, not an obvious bug. It found that certain parts of the model needed regularization Karpathy hadn&#8217;t applied, that settings he&#8217;d forgotten to tune were working against each other, and that the initialization values were off. Twenty real improvements in all, each one something Karpathy &#8212; after months of manual work &#8212; had missed.</p><p>Stacked together, they produced an <a href="https://x.com/karpathy/status/2031135152349524125">11% gain on the project&#8217;s key benchmark</a>. The <a href="https://github.com/karpathy/nanochat/commit/6ed7d1d82cee16c2e26f45d559ad3338447a6c1b">commit message</a> reads: &#8220;All of these improvements were developed by Claude running autonomously. I didn&#8217;t touch anything &#8212; incredible.&#8221;</p><p>&#8220;I am mildly surprised,&#8221; Karpathy <a href="https://x.com/karpathy/status/2031135152349524125">wrote</a>, &#8220;that my very first naive attempt already worked this well on top of what I thought was already a fairly manually well-tuned project.&#8221; From Karpathy, &#8220;mildly surprised&#8221; is the equivalent of shock.</p><p>But there&#8217;s something in the Karpathy case that goes beyond the Knuth story. Knuth&#8217;s problem was mathematics &#8212; AI solving a puzzle for humans. Karpathy&#8217;s problem was AI itself. An AI agent improving the process by which AI gets built. The improvements it found will feed into the next generation of models, which will be better at finding the next round of improvements.</p><p>&#8220;All LLM frontier labs will do this,&#8221; Karpathy wrote. &#8220;It&#8217;s the final boss battle.&#8221;</p><h2>The Serpent Eats Its Tail</h2><p>I <a href="https://blog.boxcars.ai/p/can-math-make-art">argued a while back</a> that what we call creativity is really search through a space of possibilities &#8212; and that the line between searching and creating is blurrier than we&#8217;d like to admit. Knuth&#8217;s case and Karpathy&#8217;s case didn&#8217;t settle that question, but they sharpened it. When an AI reframes a problem that stumped a Turing Award winner, or spots architectural flaws that one of the world&#8217;s best engineers missed, something is happening that doesn&#8217;t fit neatly into the &#8220;just autocomplete&#8221; box.</p><p>The Karpathy case is the one I keep thinking about, because of where it points. When AI solves a math problem, it&#8217;s doing something for us. When AI improves the system that builds AI &#8212; and those improvements feed into the next round &#8212; the loop starts to close. I <a href="https://blog.boxcars.ai/p/kluges-that-work-turning-pattern">wrote a few months ago</a> about early signs of this loop forming. Karpathy&#8217;s result suggests it&#8217;s forming faster than expected. And once an AI that improves AI training produces a better AI that&#8217;s even better at improving AI training &#8212; well, that&#8217;s the serpent eating its own tail. Kekul&#233; would recognize the shape.</p><div><hr></div><p></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>AI is starting to solve problems we said it couldn&#8217;t &#8212; and improve itself in the process. Subscribe for weekly explorations of what that means for the rest of us</em>.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p>Related</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;06e1a656-6747-4c8d-be81-b8bae92851ed&quot;,&quot;caption&quot;:&quot;\&quot;All GPT-3 has to do is to complete this. All it really does is predict the next word, it's autocomplete on steroids.\&quot; - Gary Marcus, 2021&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;sm&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Beyond Autocomplete: Guiding LLMs to Deeper Reasoning&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2024-10-10T13:03:17.374Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1523120974498-9d764390d8e5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8a2V5Ym9hcmR8ZW58MHx8fHwxNzI4NDAzMzYzfDA&amp;ixlib=rb-4.0.3&amp;q=80&amp;w=1080&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/beyond-autocomplete-guiding-llms&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:150022134,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div>]]></content:encoded></item><item><title><![CDATA[When the Walls Come Down]]></title><description><![CDATA[What happens when the cost of replicating software drops to near zero?]]></description><link>https://blog.boxcars.ai/p/when-the-walls-come-down</link><guid isPermaLink="false">https://blog.boxcars.ai/p/when-the-walls-come-down</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 05 Mar 2026 14:03:23 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="3264" height="2178" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2178,&quot;width&quot;:3264,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;brown concrete palace surrounded by body of water during daytime&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="brown concrete palace surrounded by body of water during daytime" title="brown concrete palace surrounded by body of water during daytime" srcset="https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1544939514-aa98d908bc47?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxNXx8Y2FzdGxlfGVufDB8fHx8MTc3MjcwNTU4NHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@clarky_523">Richard Clark</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><div><hr></div><p>The Theodosian Walls protected Constantinople for over a thousand years. Built in the fifth century, they were a triple line of fortification &#8212; an outer wall, an inner wall rising forty feet, and a moat &#8212; <a href="https://www.worldhistory.org/article/1180/1453-the-fall-of-constantinople/">stretching four miles across the only land approach to the city</a>. Armies came and broke against them for a millennium: Arab sieges, Bulgar assaults, Rus invasions, even the Fourth Crusade. The walls held. Siege after siege, century after century, the engineering held.</p><p>In April 1453, the Ottoman sultan Mehmed II positioned a new kind of weapon outside those walls &#8212; a massive bronze cannon called the Basilica, large enough that its stone projectiles could shatter sections of wall with a single shot. The bombardment went on for weeks, blasting the fortifications chunk by chunk into rubble. Defenders scrambled to patch the breaches each night with earth and timber, but by late May the city had fallen. Walls that had endured a thousand years of siege were undone in less than two months.</p><p>The walls hadn&#8217;t gotten weaker. The nature of the attack had changed. A technology had arrived that made the sheer <em>effort</em> of building thick, tall stone fortifications irrelevant &#8212; not because the walls were poorly constructed, but because they were brittle against a force they were never designed to absorb.</p><p>Something similar is playing out in software right now.</p><h2>The Wall Was Effort</h2><p>Some of the most durable business models in software aren&#8217;t built on patents or trade secrets. They&#8217;re built on effort &#8212; engineering complexity so deep that replicating it is, for all practical purposes, not worth attempting.</p><p>Consider <a href="https://vercel.com/">Vercel</a> and Next.js. Vercel gives away the framework for free. It&#8217;s open source &#8212; anyone can read the code, fork it, build with it. The business isn&#8217;t the framework. The business is the deployment platform, and the moat is how tightly the two are coupled. Routing, middleware, server-side rendering, image optimization &#8212; all of it <a href="https://blog.cloudflare.com/vinext/">works best, and in some cases only, on Vercel&#8217;s infrastructure</a>. The framework and the platform are stitched together through years of engineering, and that stitching is what makes it hard to leave.</p><p>The same pattern shows up across the industry. Microsoft&#8217;s Office formats are technically public &#8212; the .docx specification runs thousands of pages &#8212; but Google Docs and LibreOffice have spent years trying to render them faithfully, with interoperability that&#8217;s still imperfect. Adobe&#8217;s PDF spec is an open ISO standard, and yet most third-party viewers choke on edge cases that Adobe handles effortlessly. QuickBooks has decades of tax rules and jurisdiction-specific payroll logic baked into its codebase. In each case, the moat isn&#8217;t secrecy &#8212; the specifications are available, the code is sometimes even open source. The moat is the accumulated engineering effort required to match it.</p><p>The effort to replicate the coupling <em>was</em> the wall. Everyone could see it. Nobody could afford to climb it.</p><h2>The Clean Room</h2><p>Climbing an effort-wall through reimplementation is an old playbook. In 1982, <a href="https://www.allaboutcircuits.com/news/how-compaqs-clone-computers-skirted-ibms-patents-and-gave-rise-to-eisa/">Compaq wanted to build a computer compatible with the IBM PC</a>, but IBM&#8217;s moat was its BIOS &#8212; the firmware that made a PC an <em>IBM</em> PC. Compaq couldn&#8217;t copy it. So they reverse-engineered it in a clean room: one team disassembled IBM&#8217;s BIOS and documented every function call, every interrupt, every timing behavior, stripping it down to pure specification. A second team, completely isolated from the first, rebuilt the BIOS from scratch using only those specs. Nine months. <a href="https://www.ntari.org/post/how-clean-room-reverse-engineering-built-the-modern-tech-industry">$1 million</a>. And it worked &#8212; Compaq sold $150 million worth of PCs in their first year and broke IBM&#8217;s lock on the personal computer industry.</p><p>The clean room works. It&#8217;s just always been expensive enough that only the most determined competitors attempt it.</p><h2>$1,100</h2><p>Cloudflare had been one of those determined competitors. A project called <a href="https://opennext.js.org/">OpenNext</a> reverse-engineered Next.js&#8217;s build output to make it deployable on other platforms, but the approach was fragile &#8212; a game of catch-up that broke whenever Vercel changed something upstream. Cloudflare tried a ground-up reimplementation of the Next.js API themselves and failed. As they later put it, <a href="https://blog.cloudflare.com/vinext/">&#8220;a project like this would normally take a team of engineers months, if not years.&#8221;</a></p><p>Then, on the evening of February 13th, 2026, an engineering manager at Cloudflare opened <a href="https://docs.anthropic.com/en/docs/claude-code">Claude Code</a> and started again &#8212; rebuilding Next.js from scratch as a reimplementation of its API, built on <a href="https://vite.dev/">Vite</a>.</p><p>By the end of that first night, both the Pages Router and App Router had basic server-side rendering, middleware, server actions, and streaming working. Within three days the project could deploy to Cloudflare Workers with full client hydration, and by the end of the week it covered <a href="https://blog.cloudflare.com/vinext/">94% of the Next.js 16 API surface</a>, backed by 1,700 unit tests and 380 end-to-end tests.</p><p>One person. One week. $1,100 in API tokens.</p><p>The project is called <a href="https://github.com/cloudflare/vinext">vinext</a>, and it reimplements the full surface &#8212; routing, server rendering, React Server Components, middleware, caching, static export.</p><p>Cloudflare was careful to note the conditions that made this possible: <a href="https://blog.cloudflare.com/vinext/">&#8220;All of those things had to be true at the same time &#8212; well-documented target API, comprehensive test suite, solid build tool underneath, and a model that could actually handle the complexity.&#8221;</a> This wasn&#8217;t just &#8220;point an AI at code and press go.&#8221; It required a clear target, a way to verify correctness, and a human providing architecture and direction across more than 800 sessions.</p><p>The reaction was swift. Vercel&#8217;s CEO disclosed <a href="https://x.com/rauchg/status/2026864132423823499">seven security vulnerabilities</a> in the project. Critics coined a term for it &#8212; <a href="https://mbleigh.dev/posts/slop-forks/">&#8220;slop fork&#8221;</a> &#8212; a replication built by AI that&#8217;s rough, incomplete, not ready for production. And that&#8217;s probably fair today. vinext is experimental, and 94% coverage still leaves real gaps. But even an imperfect replication changes things, because the threat doesn&#8217;t have to succeed to make people rethink their defenses. Compaq&#8217;s clean room cost $1 million (in 1980s dollars) and nine months. Cloudflare&#8217;s cost $1,100 and a week. Even if vinext never ships to production, that price difference is hard to unsee.</p><h2>After the Walls</h2><p>After Constantinople fell, word spread across Europe. Commanders in fortified cities everywhere understood what had happened &#8212; a weapon had arrived that rendered their defenses, built over generations, suddenly uncertain. Some <a href="https://en.wikipedia.org/wiki/Bastion_fort">began redesigning</a>, lowering their walls, thickening them, angling the stone to deflect rather than absorb. Others reinforced what they had and hoped. Nobody knew yet what the right answer looked like.</p><p>There are a lot of companies sitting inside software fortifications right now, watching what happened to Vercel&#8217;s wall and wondering about their own. When tldraw&#8217;s founder <a href="https://github.com/tldraw/tldraw/issues/8082">joked about moving test files to a private repository</a> to prevent AI replication, the post went viral &#8212; not because of the proposal, but because of how plausible the threat felt.</p><p>The old walls are still standing. But everyone can hear the cannon.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>If you want to keep watching where the walls crack next, subscribe.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>  </p><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[A Website For Two]]></title><description><![CDATA[Your visitors are about to bring their own AI and that changes how companies build websites.]]></description><link>https://blog.boxcars.ai/p/a-website-for-two</link><guid isPermaLink="false">https://blog.boxcars.ai/p/a-website-for-two</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 26 Feb 2026 14:03:08 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="6240" height="4160" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:4160,&quot;width&quot;:6240,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;blue and yellow plane flying over rocky mountain during daytime&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="blue and yellow plane flying over rocky mountain during daytime" title="blue and yellow plane flying over rocky mountain during daytime" srcset="https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1579713899713-bcd3efe713aa?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw3fHx4JTIwd2luZ3xlbnwwfHx8fDE3NzIwMzgxODh8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@sushioutlaw">Brian McGowan</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>Why does Luke Skywalker bring R2-D2?</p><p>You remember Star Wars, right? The final scene where the rebellion sends fighter pilots to attack the Death Star. Every X-wing has onboard systems. The ship can fly itself well enough. But Luke and the other pilots bring their own droids. Why?</p><p>Luke doesn&#8217;t want a generic autopilot &#8212; he wants <em>his</em> droid, the one that knows how he flies, what he&#8217;s been through, what he&#8217;s likely to do next. R2-D2 doesn&#8217;t come with the plane. R2-D2 comes with Luke. Ship to ship, mission to mission, the relationship travels.</p><p>Last week I wrote about a version of this arriving on the web &#8212; WebMCP, a new browser standard that lets you bring your own AI agent into any website. Your copilot in someone else&#8217;s cockpit.</p><p>But plugging in is one thing. Working together inside is another. If R2 silently reroutes power and Luke doesn&#8217;t notice until the shields drop, that&#8217;s not collaboration &#8212; that&#8217;s a surprise. If Luke has to keep asking what R2 just did, they&#8217;re not flying together &#8212; they&#8217;re having a conversation about flying, which is slower and worse. The droid and the pilot need a shared way of working &#8212; an interface where every action is visible and every move makes sense to both.</p><p>That&#8217;s exactly where the web is now. WebMCP solves the plugging-in problem. Nobody has designed the cockpit for two yet.</p><h2>Your Droid, My Cockpit</h2><p>Consider a real estate site. Today, if the site is ambitious, it offers a chat assistant &#8212; the built-in autopilot. You can type &#8220;show me three-bedroom homes under $600k&#8221; and it filters the listings. Helpful enough. But the chat assistant is a stranger. So you end up explaining yourself from scratch: where you work, how long a commute you&#8217;ll tolerate, that your daughter likes her school and doesn&#8217;t want to switch. Talking to an AI bot on a website today is marginally better than interacting with the filters directly. Perhaps.</p><p>Now imagine arriving with your own agent &#8212; the one you&#8217;ve been mulling over buying a new house with for weeks, running financial comparisons, weighing pros and cons. You&#8217;re ready to look at actual listings, but rather than having the agent wait outside while you shop, you bring it into the site with you. The way you might take a personal stylist shopping at Neiman Marcus. (I haven&#8217;t, but I&#8217;m assuming that&#8217;s what you do.)</p><p>You say &#8220;show me some houses I might like&#8221; and your agent plugs into the site&#8217;s tools through WebMCP. It knows where your daughter goes to school and how much you hate your cross-town commute. It can look at each listing and calculate school drop-off times. It can scan photos and notice whether the yard is fenced for your dogs, or whether the guest room layout would work for when your mother-in-law visits, or whether there&#8217;s space in the back for your smoker. You don&#8217;t want a filter for &#8220;good schools.&#8221; You want homes within 15 minutes of Ridgetop Elementary. You never have to spell these things out on the site, because you&#8217;ve been spelling them out in conversation for weeks.</p><p>This is why someone brings R2-D2 instead of using the autopilot. Not because the autopilot can&#8217;t fly &#8212; but because R2 already knows the mission.</p><p>But websites were designed and built as single-player experiences. They break when you bring a second player. Your agent filters the listings, the page updates &#8212; results reorder, cards disappear, new ones surface at the top &#8212; and you&#8217;re not sure what just happened. So you open the chat panel and ask. The agent explains: filtered out properties with school ratings below 7, removed two that would put your commute over 40 minutes. Useful &#8212; but now you&#8217;re reading a paragraph in a chat window about changes that already happened on a page you&#8217;re still trying to parse.</p><p>Imagine if Luke had to stop flying and ask R2 to explain every change. He&#8217;d never have made it down the trench. What makes the X-wing cockpit work is that both pilot and droid can see the same instruments &#8212; shared gauges, shared readouts. The interface <em>is</em> the collaboration.</p><h2>The Board Is Truth</h2><p>I&#8217;ve been thinking about this a lot. What would it actually mean to redesign a website around the expectation that visitors bring their own agents?</p><p>I kept coming back to board games. Sit down at any board game and two or more players share a single surface. Someone takes a turn &#8212; buys a property, moves a piece, plays a card &#8212; and the board changes in front of everyone. You never have to ask &#8220;what did you just do?&#8221; You look at the board. It shows you. Conversation happens around the board &#8212; players negotiate, strategize, question each other&#8217;s moves &#8212; but the board is what&#8217;s real. Chat is commentary; the surface is truth.</p><p>The other analogy that stuck was the personal stylist. When you walk into a high-end store with your own stylist, the store doesn&#8217;t send a commissioned sales associate to compete with them. Instead, it provides the dressing room, the mirrors, the merchandise to work with. And because you&#8217;re shopping in <em>their</em> store, they can observe what catches your eye and help your stylist find more of it. The store becomes a collaboration surface &#8212; not between you and the store&#8217;s employee, but between you and the person you already trust.</p><p>A website for two works the same way. The site&#8217;s job isn&#8217;t to provide its own agent. It&#8217;s to provide the surface &#8212; the board &#8212; where you and your agent can work together. And because you&#8217;re on <em>their</em> site, they can make your agent&#8217;s job easier: exposing rich data, providing tools for comparison, letting the agent rearrange and annotate what&#8217;s on the surface.</p><p>To explore this idea, I built a demo to explore what this might look like. A real estate site, designed from the ground up as a website for two.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!OUPX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!OUPX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 424w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 848w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 1272w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!OUPX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png" width="590" height="634.5741758241758" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/eb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1566,&quot;width&quot;:1456,&quot;resizeWidth&quot;:590,&quot;bytes&quot;:2019367,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/189148036?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!OUPX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 424w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 848w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 1272w, https://substackcdn.com/image/fetch/$s_!OUPX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Feb459c87-faf6-4829-81b3-ff8be4f2fe96_2018x2170.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>When you arrive, the page isn&#8217;t a list of search results with filters down the side &#8212; it&#8217;s a shared board. A catalog of available homes runs across the top, the full inventory. Below it, a working set that your agent, &#8220;Maya&#8221;, is curating for you. Her avatar sits next to yours in the top bar &#8212; not hidden in a chat sidebar, but at the table.</p><p>You tell Maya to show you homes you might like, and she goes to work on the board. She pulls listings from the catalog into the &#8220;Consider&#8221; lane &#8212; each one tagged with a &#8220;&#129302;&#8221; badge so you can see which cards she chose.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ebDk!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ebDk!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 424w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 848w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 1272w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ebDk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif" width="649" height="700.3597122302158" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/ab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1200,&quot;width&quot;:1112,&quot;resizeWidth&quot;:649,&quot;bytes&quot;:3695008,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/gif&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/189148036?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!ebDk!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 424w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 848w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 1272w, https://substackcdn.com/image/fetch/$s_!ebDk!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fab9a3109-c824-4900-b3b3-83f73c11df71_1112x1200.gif 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Click into a listing and this is where it gets personal. The site shows the standard details &#8212; price, beds, baths, square footage &#8212; but below that, Maya has added a section: <strong>&#8220;How This Fits Your Week.&#8221;</strong> School drop-off stays around 10 minutes from this address, and your regular Central Market run stacks easily into weekday errands. She&#8217;s also flagged a concern: the noise level because of how close the lot is to a restaurant.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!EkOX!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!EkOX!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 424w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 848w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 1272w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!EkOX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png" width="651" height="686.7692307692307" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1536,&quot;width&quot;:1456,&quot;resizeWidth&quot;:651,&quot;bytes&quot;:1732054,&quot;alt&quot;:&quot;&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/189148036?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" title="" srcset="https://substackcdn.com/image/fetch/$s_!EkOX!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 424w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 848w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 1272w, https://substackcdn.com/image/fetch/$s_!EkOX!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F5cbd9406-bf85-4f47-bcea-b2dfd8d356a7_1890x1994.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>No real estate site would ever show you this. These aren&#8217;t filters a product manager designed. This is your agent annotating listings with <em>your life</em> &#8212; your school, your grocery store, your weekend rhythm.</p><p>And here&#8217;s what the site <em>doesn&#8217;t</em> know: why Maya chose those listings. She searched for homes within a 15-minute drive of a specific address &#8212; but the site only saw the address and the radius, not the fact that your daughter goes to school there. The personal reasoning stays with your agent. The site provides the tools; your agent provides the strategy. The board doesn&#8217;t need to know why you&#8217;re making your moves.</p><p>And if you disagree with something Maya did &#8212; if she moved a listing you wanted to keep &#8212; just drag and move the card back into consideration. Maya can see your actions, as can the site. The board is shared; the control is yours.</p><h2>A Three-Player Game</h2><p>For thirty years, the web has been a two-player game. The site holds the intelligence &#8212; the data, the inventory, the recommendations. The user brings the context &#8212; search terms, clicks, form fields. That exchange is the whole interaction model.</p><p>But people are starting to invest in their own agents &#8212; training them with preferences, constraints, the texture of their daily lives. That makes the web a three-player game. And the current industry trajectory &#8212; making a site&#8217;s own AI smarter &#8212; may not be the right response. That intelligence is a stranger to the user. The user&#8217;s agent is not. The smarter the site makes its own AI, the more it risks becoming the commissioned sales associate who steps in front of the personal stylist.</p><p>The opportunity might be different: build the board, not the brain. A real estate site doesn&#8217;t make money when someone searches &#8212; it makes money when someone books a showing with a realtor. If the visitor&#8217;s agent helps them find the right homes faster, with higher confidence, they book viewings sooner and with stronger intent. The site wins the same way Neiman Marcus wins when a customer&#8217;s stylist picks out three perfect outfits: they&#8217;re still buying merchandise, and buying more of it because the match was better.</p><p>The more useful the <em>board</em>, the better the visitor&#8217;s agent can do its job &#8212; and the more reason people have to come to the site in the first place. Because if they can&#8217;t bring their agent to a site and work together effectively, they&#8217;ll find one where they can.</p><p>Luke Skywalker didn&#8217;t need the smartest X-wing. He needed one that flew well and let him and R2-D2 work together seamlessly. That might not be a bad blueprint for what comes next.</p><p></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Subscribe if you want to keep up. Forward to your agent if you want it to keep up with you.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p><p></p><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[Bring Your Own Agent]]></title><description><![CDATA[How WebMCP gives AI a seat at every website]]></description><link>https://blog.boxcars.ai/p/bring-your-own-agent</link><guid isPermaLink="false">https://blog.boxcars.ai/p/bring-your-own-agent</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 19 Feb 2026 14:02:27 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<p></p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="5472" height="3080" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3080,&quot;width&quot;:5472,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;A blue shuttered window on a yellow wall&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="A blue shuttered window on a yellow wall" title="A blue shuttered window on a yellow wall" srcset="https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1765288115376-d8d527c9b12f?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8d2VicGFnZSUyMGRvb3J8ZW58MHx8fHwxNzcxNDk4OTA2fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@jorisbeugels">Joris Beugels</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>&#8220;Mr. Watson, come here &#8212; I want to see you.&#8221;</p><p>Those were the first words ever spoken on a telephone. Alexander Graham Bell hadn&#8217;t meant it as a grand demonstration &#8212; he just needed his assistant in the room. But the irony is hard to miss: the most advanced communication device in history, and the first words it carried were a request for someone to be physically present. The telephone could transmit a voice across a wire. But it couldn&#8217;t point at anything.</p><p>Today, we&#8217;ve built ourselves the most capable assistants in history. They can reason through complex problems, recall details we&#8217;ve long forgotten, and increasingly, they&#8217;re starting to know us &#8212; our preferences, the way we like things done. And yet, every interaction follows the same script: we type into a little box, wait for text to appear, type again. We describe what we&#8217;re seeing. They describe what they&#8217;re thinking. Back and forth, through text.</p><p>Picture the absurdity of it. You&#8217;re staring at a website &#8212; a rich, visual interface full of images, layouts, interactive elements &#8212; and beside it, in a narrow chat panel, you&#8217;re trying to <em>describe</em> what you want to your AI assistant in words. It&#8217;s like calling someone on the phone to help you rearrange your living room. You can hear each other fine. But nobody can point.</p><p>For the past few years, the prevailing response has been to make the chat better. Chat gets smarter, richer, more capable &#8212; the telegraph becomes a fax. But what if the real leap isn&#8217;t a better chat? What if it&#8217;s getting in the same room?</p><h2>The Death of the Homepage (and Other Predictions)</h2><p>Last August, Fortune ran a piece with a blunt thesis: <a href="https://fortune.com/2025/08/26/homepage-is-dead-future-is-question-search-chatbots-ai/">the homepage is dead</a>. &#8220;The leading digital experiences of 2026 will be conversation systems with seamless visual supports, not websites in the traditional sense.&#8221; The numbers backed it up. Nearly 60% of Google searches now end without a single click &#8212; up from 26% just two years earlier. ChatGPT processes 2.5 billion prompts a day. Gartner predicts traditional search volume will drop 25% by the end of this year. Why visit a website when you can just ask?</p><p>The web took the hint. An entire industry sprang up around making sites readable by AI rather than visitable by humans. AIO &#8212; AI Optimization &#8212; became the new SEO, focused not on ranking in search results but on <a href="https://www.pageonepower.com/linkarati/what-is-ai-optimization-and-why-it-matters-for-seo-in-2026">getting your content cited by chatbots</a>. New protocols emerged to make sites machine-readable &#8212; structured data that AI agents could consume without ever rendering a page. The direction was clear: the web was becoming a data layer, and chat was becoming the interface.</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;076eef72-1ebf-4610-bc5e-8c591052e612&quot;,&quot;caption&quot;:&quot;If you were a film director in the 90s, you'd spend opening weekend with your stomach in knots, waiting for Roger Ebert and Gene Siskel's verdict on your latest work. Those iconic \&quot;two thumbs up\&quot; weren't just reviews&#8212;they were career-makers. Studios would hold their breath as the critics delivered their judgment, knowing that a positive review could dri&#8230;&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;md&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Ask Not What Your Customers Think of You, But What Their AI Thinks of You&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2025-03-13T13:02:56.212Z&quot;,&quot;cover_image&quot;:&quot;https://substackcdn.com/image/fetch/$s_!Uz5R!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc2bcc3f6-c8d5-4f3f-ae36-8c4192e606a8_1024x1024.webp&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/ask-not-what-your-customers-think&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:158907987,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><p>And when text-only chat felt too limiting, the industry&#8217;s answer was to make chat richer. Anthropic introduced <a href="https://support.claude.com/en/articles/9487310-what-are-artifacts-and-how-do-i-use-them">Artifacts</a> &#8212; interactive mini-apps that render alongside your conversation. OpenAI followed with <a href="https://openai.com/index/introducing-canvas/">Canvas</a>, a collaborative workspace for writing and coding that lives inside ChatGPT. Then came <a href="https://shopify.engineering/mcp-ui-breaking-the-text-wall">MCP-UI</a>, which embedded full interactive components &#8212; product selectors, image galleries, booking forms &#8212; directly into chat conversations. Shopify&#8217;s engineering team explained the motivation plainly: a product &#8220;isn&#8217;t just a SKU and price &#8212; it&#8217;s images showing different angles, color swatches you can click, size selectors that update availability.&#8221; Text alone can&#8217;t carry that. So they built a way to put those elements inside the chat window. By January 2026, <a href="http://blog.modelcontextprotocol.io/posts/2026-01-26-mcp-apps/">MCP Apps became an official extension</a> of the protocol, letting any tool return rich UI that renders right in the conversation.</p><p>Each step made the chat better &#8212; richer components, more interactive widgets, fuller visual experiences squeezed into a conversation thread. But notice the assumption underneath all of it: the chat window remains the center of gravity. The website comes to the chat &#8212; as data, as embedded cards, as sandboxed iframes. Everything flows toward that narrow column of conversation.</p><p>And for simple tasks, it works. Ask a question, get an answer. Book a flight, confirm the details. But somewhere between &#8220;book me a flight&#8221; and &#8220;help me design a wedding invitation,&#8221; the chat window hits a wall. UX researchers have been <a href="https://medium.com/design-bootcamp/cognitive-and-computational-limitations-of-ai-chat-interfaces-a62d1a9d744a">flagging the problem</a>: text-based AI interfaces risk &#8220;regressing to high-memory-load, low-visual-feedback systems,&#8221; undoing decades of progress in interface design. One observer <a href="https://reconfigured.io/blog/beyond-the-chat-box-future-ai-interfaces-marko-jevremovic">put it more simply</a>: &#8220;Half of our work now is copy-pasting text from one chat to another.&#8221;</p><p>The fax machine got very good. But you still can&#8217;t rearrange furniture well with it.</p><h2>Bring Your Own Agent</h2><p>What if instead of bringing the website into the chat, the agent came to the website?</p><p>That&#8217;s the reversal at the heart of <a href="https://venturebeat.com/infrastructure/google-chrome-ships-webmcp-in-early-preview-turning-every-website-into-a">WebMCP</a>, a new browser standard that quietly shipped in Chrome&#8217;s early preview this month. The idea is simple: a web page can register its features as &#8220;tools&#8221; &#8212; functions with plain-language descriptions that an AI agent can discover and call directly. A real estate site might expose &#8220;filter by neighborhood&#8221; and &#8220;compare these two listings,&#8221; while a design tool offers &#8220;change background color&#8221; or &#8220;show me templates like this.&#8221; The agent doesn&#8217;t screenshot the page and guess where to click. It reads the menu of what&#8217;s available and calls the function. Techstrong.ai had the right headline: <a href="https://techstrong.ai/features/chrome-just-gave-ai-agents-their-own-front-door-to-the-web/">Chrome just gave AI agents their own front door to the web</a>.</p><p>The timing isn&#8217;t accidental. In late January, Google moved <a href="https://blog.google/products-and-platforms/products/chrome/gemini-3-auto-browse/">Gemini into Chrome&#8217;s side panel</a> &#8212; not as a floating window you summon, but as a multimodal presence that can see the page you&#8217;re on, understand images and text, and act on what it finds. Microsoft has been building the same thing with Copilot in Edge. As these agents gain voice capabilities, you won&#8217;t just type to them &#8212; you&#8217;ll talk to your agent while you&#8217;re both looking at the same page. The browser is becoming a two-seat vehicle.</p><p>And here&#8217;s what makes this different from every website bolting on its own chatbot over the past two years. Those chatbots were strangers. Every site you visited, you met a new one &#8212; a fresh AI that knew nothing about you, your preferences, your history. You had to start from scratch each time, explaining what you wanted to a stranger who worked for the site.</p><p>With WebMCP, you bring <em>your</em> agent. The Gemini that rides in Chrome&#8217;s side panel has been with you all day. It knows what you were researching this morning, what you bookmarked last week, what decisions you&#8217;ve been weighing. This is BYOA &#8212; bring your own agent &#8212; and it flips the first wave of AI on the web entirely on its head. Wave one was every website hiring its own AI, a stranger at every door. Wave two is you walking in with yours.</p><p>Consider the difference. You land on a wedding venue site. The site&#8217;s chatbot greets you and asks: how many guests? What date? Indoor or outdoor? What&#8217;s your budget? You type it all in, one field at a time, teaching a stranger about your wedding.</p><p>Now imagine arriving with your agent instead. Your agent already knows you&#8217;re planning for 150 guests, that you&#8217;ve been looking at June dates, that your partner keeps pinning rustic outdoor spaces. The moment you land on the page, your agent reads the site&#8217;s tools and filters the results before you&#8217;ve typed a word. The page loads and it&#8217;s already showing you what you came for. You scroll through photos, click on two that catch your eye, and ask your agent to check availability. The page updates &#8212; calendars and pricing appear for just those two.</p><p>It&#8217;s the difference between walking into a department store alone and walking in with a personal shopper who knows your wardrobe, your size, and what you already own. The personal shopper makes sure the dressing room only has clothes that fit, in colors you actually wear. You still choose. But you skip the tedious work of explaining yourself to every store from scratch.</p><p>The website provides the tools. Your agent brings the context.</p><p>We&#8217;re early. WebMCP is still in preview, the agents are still learning what to do with the tools they&#8217;re given, and there&#8217;s a lot to figure out about trust, permissions, and what happens when your personal agent meets a website&#8217;s business model. But the direction is clear, and it&#8217;s not the one most people predicted. The visual web isn&#8217;t dying. It&#8217;s not being swallowed by chat. It&#8217;s being redesigned, for the first time, with a second seat.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p><p><em>Related</em></p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;d33c78d2-739b-4fb9-86c5-423fddea118e&quot;,&quot;caption&quot;:&quot;I&#8217;ve been building software for over two decades. The process always follows the same pattern: design the interface, ship it, then users bring their data.&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;md&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Software That Sees Before It Asks&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2026-01-08T14:03:06.747Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/software-that-sees-before-it-asks&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:183876684,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:2,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div>]]></content:encoded></item><item><title><![CDATA[The Echo of Demand]]></title><description><![CDATA[What a 1960s supply chain simulation can tell us about the AI infrastructure boom]]></description><link>https://blog.boxcars.ai/p/the-echo-of-demand</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-echo-of-demand</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 12 Feb 2026 14:02:25 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4732" height="2947" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2947,&quot;width&quot;:4732,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;green and blue water wave&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="green and blue water wave" title="green and blue water wave" srcset="https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1599290915883-e449350ca4a2?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8cmlwcGxlfGVufDB8fHx8MTc3MDg5NzY4N3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@almairene">Alma Snortum-Phelps</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>Week 8. You own a small brewery&#8212;a regional Mexican lager that&#8217;s found its niche in local restaurants and corner stores. The order sheet says zero cases. Your warehouse is stacked with beer nobody&#8217;s buying.</p><p>A month ago, everything was steady. Four cases a week from your distributor, same as it had been for as long as you could remember. Then the order came in: twenty cases. Five times the normal run rate, overnight.</p><p>You shipped what you had and faced a sixteen-case backlog. A signal that strong meant something downstream had clicked. The expensive campaign you had bet on, the new distributor, whatever it was. You added a second shift, authorized overtime, expedited raw materials. You weren&#8217;t going to miss the moment.</p><p>Then the orders fell. Twelve. Eight. This week: zero.</p><p>The facilitator calls the game.</p><h2>The Game That Never Changes</h2><p>You&#8217;ve been playing the <a href="https://beergame.org/">Beer Game</a>, a supply chain simulation MIT has run for more than fifty years. The players change&#8212;Harvard MBAs, Fortune 500 executives, engineering students&#8212;but the outcome never does. Rational people, reasonable decisions, real information: same disaster every time.</p><p><a href="https://news.mit.edu/2016/professor-emeritus-jay-forrester-digital-computing-system-dynamics-pioneer-dies-1119">Jay Forrester</a> built the game in the 1960s after watching GE&#8217;s appliance factories swing between three shifts and mass layoffs with no obvious external cause. Management blamed market forces&#8212;unpredictable customer demand, competitive pressure. Forrester ran a simulation and proved otherwise: the oscillations came from inside the system, from the structure of how decisions and delays compounded each other. The problem isn&#8217;t the players. It&#8217;s the very structure.</p><p>This game has been demonstrating real-world patterns for decades. And, it might be a good lens for understanding the AI infrastructure build-out.</p><p>But first, let&#8217;s see how we got here.</p><h2>Four Weeks to Five-Fold</h2><p>To make the mechanics clear, we&#8217;re going to simplify: one retailer, one wholesaler, one distributor, one factory. A single product moving through a single supply chain.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sPft!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sPft!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!sPft!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!sPft!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!sPft!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sPft!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png" width="434" height="393.75961538461536" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/cfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1321,&quot;width&quot;:1456,&quot;resizeWidth&quot;:434,&quot;bytes&quot;:190400,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sPft!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!sPft!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!sPft!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!sPft!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fcfc77647-619b-43f4-bf0e-7527a1a9932d_1712x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Steady state: four cases ordered, four in stock, at every layer.</em></figcaption></figure></div><p>The game starts in equilibrium. Customers buy four cases of beer a week, and that number flows unchanged through every layer&#8212;retailer to wholesaler to distributor to factory. Everyone orders four, ships four, keeps four cases as a buffer. Just enough to absorb a small demand shift without panic, not enough to tie up capital. The supply chain hums along.</p><p>Then one week, something shifts. Maybe a local promotion. Maybe a random fad for Mexican beer. Whatever the reason, customers order eight cases instead of four.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!ymbK!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!ymbK!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!ymbK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png" width="475" height="430.9581043956044" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/fc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1321,&quot;width&quot;:1456,&quot;resizeWidth&quot;:475,&quot;bytes&quot;:217337,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!ymbK!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!ymbK!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Ffc5e3d85-162b-4dfe-b14e-578cd6cc6626_1712x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Customer demand doubles. The retailer&#8217;s buffer is gone. Everyone else still sees four.</em></figcaption></figure></div><p>The retailer&#8217;s shelf is empty by Friday. The four-case buffer vanished in a single day. Empty shelves mean lost sales, and so the retailer orders twelve-cases&#8212;eight to cover what looks like sustained demand, four to rebuild the vanished buffer.</p><p>But there&#8217;s a three-week lag between ordering and delivery. By the time Week 2 rolls around, demand has already dropped back to four. The retailer sees this, pulls the next order down to eight as a cautious correction, and feels good about adapting to what was probably just a temporary spike.</p><p>That original twelve-case order, though? Already on its way upstream.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Foh6!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Foh6!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Foh6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png" width="490" height="444.5673076923077" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1321,&quot;width&quot;:1456,&quot;resizeWidth&quot;:490,&quot;bytes&quot;:226695,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Foh6!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!Foh6!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F69515a2d-9316-4efb-ad25-6f50d7530320_1712x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>The retailer has already corrected. The wholesaler is just seeing the spike.</em></figcaption></figure></div><p>The wholesaler sees twelve cases on the order form&#8212;triple the normal run rate. Business must be picking up. They ship the four cases in inventory and face an eight-case shortfall. The warehouse is empty, and the choice is obvious: order sixteen from the distributor. Twelve to meet the new demand level, four to rebuild the buffer.</p><p>The retailer&#8217;s new order&#8212;the eight cases that says &#8220;it was just a spike, we&#8217;re back to normal&#8221;&#8212;won&#8217;t reach the wholesaler until next week. By then, the sixteen-case order has already hit the distributor.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Lok4!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Lok4!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Lok4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png" width="499" height="452.7328296703297" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1321,&quot;width&quot;:1456,&quot;resizeWidth&quot;:499,&quot;bytes&quot;:214238,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!Lok4!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!Lok4!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F0367d941-fed2-4f91-b463-9f187ccde0ff_1712x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>The signal grows at each layer. The distributor sees sixteen &#8212; four times normal &#8212; while the retailer is back to baseline</em></figcaption></figure></div><p>The distributor sees sixteen cases&#8212;four times normal. Same pattern: ship the four in stock, stare at the twelve-case gap, order twenty upstream to cover the surge and rebuild the safety margin. The wave is building.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!dnJy!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!dnJy!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 424w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 848w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!dnJy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png" width="559" height="515.2321428571429" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1342,&quot;width&quot;:1456,&quot;resizeWidth&quot;:559,&quot;bytes&quot;:215473,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!dnJy!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 424w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 848w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!dnJy!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c56e1af-c2e3-4154-897b-2bbc340a6a6d_1685x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Twenty cases hit the factory. The spike has been amplified five-fold &#8212; and it&#8217;s already over downstream.</em></figcaption></figure></div><p>The order arrives at your factory: twenty cases. Five times the normal run. You ship the four you have ready, clear out finished goods, and look at the sixteen-case backlog. This isn&#8217;t a blip&#8212;this is the trajectory you&#8217;ve been waiting for. Time to scale. Second shift, overtime, expedited materials. The breakthrough moment.</p><p>What you can&#8217;t see from the factory floor: the correction was already in motion three weeks ago. The retailer had dialed back to eight cases by Week 2. But each layer upstream was still reacting to the signal from the week before&#8212;adding buffer, staying one step behind the truth. By the time the wave reached you, the original spike had been gone for three weeks.</p><p>You weren&#8217;t responding to demand. You were responding to the echo of demand.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!CjzT!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!CjzT!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!CjzT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png" width="508" height="460.89835164835165" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/c593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1321,&quot;width&quot;:1456,&quot;resizeWidth&quot;:508,&quot;bytes&quot;:257863,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/187735400?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!CjzT!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 424w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 848w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 1272w, https://substackcdn.com/image/fetch/$s_!CjzT!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fc593d48b-d3d2-4c21-8f7a-d59250096286_1712x1553.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><em>Orders have collapsed. Inventory piles up at every layer &#8212; worst at the factory, which scaled up last.</em></figcaption></figure></div><h2>Echo or Signal?</h2><p>Every decision was rational. The customer demand spike was real&#8212;people genuinely wanted Mexican beer that week. Each player saw empty inventory, ordered more to cover the shortfall and rebuild their buffer. Nobody fabricated numbers. Nobody panicked.</p><p>But a one-week spike that settled immediately amplified into a five-fold surge by the time it reached the factory. This is the bullwhip effect&#8212;small fluctuations at retail become large swings upstream. The structure is almost elegant in its simplicity: time delays mean each layer can only see the order from directly below, not the original customer demand. Inventory runs out, you order more. Your partner&#8217;s order spikes, you add buffer.</p><p>Now add back the complexity we stripped out. Multiple retailers, each responding independently. Multi-week demand patterns that look like trends. Competing signals from different channels. And crucially: narrative.</p><p>By the time that twenty-case order reaches your factory, it doesn&#8217;t land as &#8220;echo of a temporary spike.&#8221; It lands as confirmation. The marketing campaign worked. The regional expansion paid off. Time to go national. Champagne breaks out. The executive team celebrates. The board approves new facilities, new hires, new capacity.</p><p>The structure creates the outcome. But the narrative shapes what happens next.</p><h2>Cisco&#8217;s $2.25 Billion Echo</h2><p>This simulation is a pattern that plays out with real consequences repeatedly.</p><p>Cisco experienced this in 2001. The dot-com boom was real&#8212;startups launching daily, venture capital flowing freely, businesses racing to get online. Every one of those startups needed routers. Every ISP was expanding capacity. Every telecom was building out infrastructure. The demand was genuine.</p><p>Cisco&#8217;s contract manufacturers were ordering independently&#8212;each responding to their own slice of the orders, each adding buffer.</p><p>By the time those orders reached Cisco&#8217;s supply chain, they validated the narrative - the internet was taking over, Cisco was winning. Hiring surged, production expanded, new facilities broke ground. The stock soared.</p><p>Then the boom ended. Cisco held over <a href="https://supplychainnuggets.com/learning-from-ciscos-2-25-billion-inventory-collapse/">$2.25 billion in unsold inventory</a>, the stock fell 84%, and <a href="https://money.cnn.com/2001/03/09/technology/cisco/index.htm">eight thousand jobs disappeared</a>.</p><p>Same game. Different product.</p><h2>Same Game, Longer Delays</h2><p>Now let&#8217;s look at AI infrastructure through the lens of the beer game. We don&#8217;t have the full story&#8212;companies don&#8217;t publish their internal decision-making, and supply chains are complex. But we can trace the basic structure: customers use AI models, AI labs like Anthropic power those models by renting compute from cloud providers (hyperscalers) like AWS, those providers order datacenters from builders, and builders need power from utilities. We could trace a similar supply chain to semiconductor and other suppliers as well but we&#8217;ll stick with data center construction and power since that&#8217;s in the news lately.</p><p>Like in our beer story, we start with a demand spike. When <a href="https://www.anthropic.com/news/claude-3-family">Claude 3 launched in March 2024</a>, coding assistants could finally work longer on more complicated tasks. <a href="https://www.aicerts.ai/news/anthropics-specialized-llm-claude-code-reaches-1b-run-rate/">Claude Code</a> hit a $1 billion run rate as developers and non-developers alike rushed to try it. Anthropic&#8217;s <a href="https://www.visualcapitalist.com/charted-the-soaring-revenues-of-ai-companies-2023-2025/">total revenue climbed from $1 billion</a> at the end of 2024 to a <a href="https://www.reuters.com/technology/artificial-intelligence/anthropic-projects-much-26-billion-annualized-revenue-2026-2025-12-23/">$9 billion annualized run rate</a> by the end of 2025, with <a href="https://www.reuters.com/technology/artificial-intelligence/anthropic-projects-much-26-billion-annualized-revenue-2026-2025-12-23/">enterprise customers driving 80%</a> of that revenue. The demand was real. But is this the moment AI coding permanently changes how software gets built&#8212;or is everyone just trying Mexican beer because it&#8217;s Cinco de Mayo?</p><p>And just like the retailer who ordered twelve cases instead of four, Anthropic needed to add buffer. Running out of compute means users leave for competitors. <a href="https://www.wheresyoured.at/costs/">Through September 2025</a>, the company spent $2.66 billion on AWS compute against $2.55 billion in revenue&#8212;and inference costs came in <a href="https://www.theinformation.com/articles/anthropic-lowers-profit-margin-projection-revenue-skyrockets">23% higher than the company expected</a>, compressing margins and pushing expenses above plan. The orders flowing to AWS were already larger than Anthropic had budgeted for.</p><p>Pulling back wasn&#8217;t an option. OpenAI exited 2025 at roughly $20 billion in annualized revenue with 900 million weekly active users. Anthropic, almost entirely dependent on enterprise contracts, was <a href="https://www.theinformation.com/articles/anthropic-lowers-profit-margin-projection-revenue-skyrockets">burning cash at a similar rate</a> with a fraction of the user base. Slowing down meant losing customers to a competitor with a hundred times the audience. So Anthropic is planning for <a href="https://www.theinformation.com/articles/anthropic-lowers-profit-margin-projection-revenue-skyrockets">$18 billion in revenue this year, $55 billion next year</a>, with break-even pushed to 2028. Training costs alone: $12 billion this year, $23 billion next. The order flowing upstream to AWS keeps getting bigger.</p><p>Anthropic&#8217;s primary cloud provider is AWS. Like the wholesaler receiving that twelve-case order, AWS sees the signal and responds. But they&#8217;re not just seeing Anthropic. They&#8217;re seeing orders from other AI labs too, each booking capacity independently. AWS can&#8217;t afford to run out and lose customers to Microsoft or Google. <a href="https://www.vedp.org/press-release/2023-01/amazon-web-services-2023">Back in January 2023</a>, they&#8217;d announced a $35 billion Virginia commitment by 2040, and by <a href="https://www.datacenterfrontier.com/hyperscale/article/33010712/aws-plans-11b-investment-for-2-data-center-campuses-in-louisa-county-va-by-2040">October of that year</a> were filing applications for $11 billion in datacenters in rural Louisa County. The expansion continued: <a href="https://www.datacenterdynamics.com/en/news/aws-activates-project-rainier-cluster-of-nearly-500000-trainium2-chips/">in October 2025</a>, they activated a massive computing site in Indiana. Build bigger, add buffer, don&#8217;t run out.</p><p>Builders watching this expansion saw the orders multiply. Turner Construction&#8217;s datacenter revenue <a href="https://www.rprealtyplus.com/news-views/turner-construction-doubles-data-center-revenue-as-ai-projects-drive-40-backlog-122938.html">nearly doubled</a>&#8212;from $3.6 billion in 2024 to $6.4 billion in just nine months of 2025. Orders were coming from AWS, Microsoft, Google&#8212;each hyperscaler ordering independently. Same pattern as the factory seeing the twenty-case order: scale up fast, hire more crews.</p><p>Dominion Energy, Virginia&#8217;s largest utility, watched the Northern Virginia corridor transform. Datacenter projects were appearing in every forecast, and the company&#8217;s contracted capacity <a href="https://www.datacenterdynamics.com/en/news/dominion-energy-nearly-doubles-data-center-capacity-under-contract-to-40gw/">jumped from 21 gigawatts in July 2024 to 40 gigawatts</a> a year later&#8212;an 88% increase. Dominion&#8217;s response: a <a href="https://www.power-technology.com/news/dominion-capital-expenditure-data-centre-demand/">five-year capital plan</a> totaling $50.1 billion, with $41 billion earmarked for Virginia&#8217;s grid, generation, and transmission projects to support datacenters. New generation capacity, transmission upgrades, substations.</p><p>But the Beer Game&#8217;s real lesson is about timing. In the simulation, the wave comes and goes in weeks&#8212;fast enough to see the full cycle, fast enough for everyone to see. In AI infrastructure, the cycle runs on years. Power infrastructure <a href="https://www.iea.org/data-and-statistics/charts/average-power-generation-construction-time-capacity-weighted-2010-2018">takes three to five years</a> to build. Commitments made in 2023 won&#8217;t complete until 2028. If the demand wave breaks before construction finishes, you don&#8217;t just end up with excess inventory. You end up with half-built infrastructure.</p><p>We&#8217;ve seen this pattern before. China&#8217;s real estate boom was amazing until it wasn&#8217;t. Now China has entire cities of unfinished apartment blocks, half-built infrastructure projects, and stranded capital. The wave broke before construction finished.</p><p>Same game. Different product.</p><h2>Knowing Doesn&#8217;t Help</h2><p>The Beer Game is one of the most-taught supply chain lesson in business history. You&#8217;ve probably played it yourself. You know about the bullwhip. You can see the structure. That was never the problem.</p><p>The problem is that you didn&#8217;t start a brewery to study supply chains. You started it because you believe Mexican beer&#8217;s moment is coming&#8212;that it stops being the niche choice and becomes the default. Four cases a week keeps the lights on. It was never the plan. The plan was always the hockey stick: the quarter where orders jump and keep jumping, where the revenue curve bends and doesn&#8217;t bend back. You&#8217;ve been waiting for it since you signed the lease.</p><p>The bullwhip looks exactly like the hockey stick. Same spike on the order sheet. Same revenue curve. Same boardroom energy. And when it arrives, everything around you confirms it. The stock price climbs. Your employees&#8217; options, worth nothing at four cases a week, suddenly mean something. The board stops asking &#8220;when&#8221; and starts asking &#8220;how fast.&#8221; Analysts upgrade. Investors come calling. Every signal you&#8217;re receiving says the moment has arrived.</p><p>What would it take to look at all of that and say: it&#8217;s just Cinco de Mayo?</p><div><hr></div><p></p>]]></content:encoded></item><item><title><![CDATA[When AI Becomes Plumbing]]></title><description><![CDATA[How AI moves from product to infrastructure]]></description><link>https://blog.boxcars.ai/p/when-ai-becomes-plumbing</link><guid isPermaLink="false">https://blog.boxcars.ai/p/when-ai-becomes-plumbing</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 05 Feb 2026 14:03:54 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4928" height="3264" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3264,&quot;width&quot;:4928,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;a close up of a bunch of pipes on a wall&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="a close up of a bunch of pipes on a wall" title="a close up of a bunch of pipes on a wall" srcset="https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1646009445351-b8192e095f3a?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyNXx8cGx1bWJpbmd8ZW58MHx8fHwxNzcwMjY5MjU1fDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@rstar50">Roger Starnes Sr</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p></p><p>What does it mean to use AI today?</p><p>You open a browser tab. ChatGPT. Claude. Maybe Gemini. You type a question, get an answer, close the tab. That&#8217;s AI. It&#8217;s an app. A website. A thing you do.</p><p>Meanwhile, your computer has no idea any of this happened. Your calendar doesn&#8217;t know. Your email client doesn&#8217;t know. AI lives in a browser tab, isolated from everything else on your machine.</p><p>We&#8217;ve been here before.</p><h2>When the Network Was Elsewhere</h2><p>In 1994, you could go online. You&#8217;d launch AOL or CompuServe, hear the modem screech and hiss&#8212;<a href="https://www.popularmechanics.com/science/a29611456/internet-dialup-modem-sounds/">two machines negotiating in audible data</a>&#8212;and suddenly you were somewhere else. Science fiction had taught us to call it cyberspace: a neon-lit elsewhere you jacked into. You&#8217;d check email, browse content, maybe enter a chat room. Then you&#8217;d disconnect and your computer would be offline again.</p><p>The network was a place you visited. Your computer didn&#8217;t live there.</p><p>Windows 3.1 didn&#8217;t know what TCP/IP was. If you wanted your computer to actually speak the language of the internet, you needed third-party software like <a href="https://en.wikipedia.org/wiki/Trumpet_Winsock">Trumpet Winsock</a>&#8212;a $30 shareware stack that required manual configuration. It was like teaching your computer a foreign language it was never designed to speak.</p><p>This wasn&#8217;t just inconvenient. It was architectural. Your spreadsheet couldn&#8217;t fetch data. Your calendar had no idea the network existed. If you wanted information from the internet in another program, you were the messenger: copy from AOL, paste into Word, write down the weather forecast, manually add the phone number to your contact book.</p><p>Networking was something you made your computer do, temporarily, by launching special software and shepherding data between worlds. Sound familiar?</p><h2>When Your Computer Joined the Network</h2><p>In August 1995, <a href="https://tangentsoft.com/wskfaq/articles/history.html">Windows 95 shipped with TCP/IP built in</a>. The operating system could finally speak the language of the internet natively. And once it wasn&#8217;t something you did but something your computer <em>was</em>&#8212;the world changed.</p><p>Because things started happening without you.</p><p>You&#8217;re asleep. Your computer isn&#8217;t. At 3am it checks a server in Redmond, downloads a security patch, installs it, restarts a background process. You never know this happened. You never needed to know. Before, updating software meant, ordering a floppy disk, waiting for it to arrive, running the installer. Now software just... stayed current. Your computer reached out and fixed itself.</p><p>Your calendar receives an email with meeting details. It parses the date, the time, the location, checks for conflicts, adds the event, sets a reminder, syncs to your phone. You open your calendar the next morning and the meeting is there.</p><p>The weather widget on your desktop updates every hour. The clock synchronizes itself with atomic time servers. Your documents back up to a server farm you&#8217;ll never see. Your photos upload while you sleep.</p><p>Run <code>netstat</code> on your computer right now. Count the active connections. Dozens of processes you&#8217;ve never heard of are talking to servers you&#8217;ve never seen&#8212;fetching, syncing, checking, reporting. Your computer isn&#8217;t occasionally visiting the internet. It lives there. It&#8217;s a participant on the network, acting on your behalf, in the background, constantly.</p><p>The cyberspace that science fiction imagined&#8212;that neon elsewhere you&#8217;d jack into&#8212;never materialized. What happened was stranger. The network dissolved into everything. You stopped &#8220;going online&#8221; because there was no longer an offline to go from. The internet became plumbing: invisible, assumed, always on.</p><p>Once infrastructure is in place, the world reorganizes around it. Microsoft didn&#8217;t predict weather widgets or automatic updates or cloud sync. No one in 1995 sat down and designed the networked future. It got co-created. Once developers could assume networking existed, they built things that only made sense <em>because</em> that infrastructure was there. The applications emerged from the capabilities. Millions of developers suddenly had a capacity they could take for granted, and the explosion of what became possible was impossible to predict beforehand.</p><h2>This Pattern Is Repeating</h2><p>In June 2024, Microsoft shipped the <a href="https://www.infoworld.com/article/2337328/copilot-runtime-building-ai-into-windows.html">Windows Copilot Runtime</a>&#8212;a native AI layer built directly into the operating system. Not an app you install. Not a service you subscribe to. Plumbing. The OS now includes more than 40 machine learning models and a specialized small language model called <a href="https://www.infoworld.com/article/3823290/diving-into-the-windows-copilot-runtime.html">Phi Silica</a>, designed to run on your local hardware.</p><p>Apple made the same move. In October 2024, they rolled out <a href="https://www.apple.com/newsroom/2024/09/apple-intelligence-comes-to-iphone-ipad-and-mac-starting-next-month/">Apple Intelligence</a>&#8212;a <a href="https://machinelearning.apple.com/research/introducing-apple-foundation-models">3 billion parameter model</a> running natively on Apple silicon. The model lives in unified memory alongside everything else your computer does. It can see what&#8217;s on your screen. It can take action across apps. It can understand context in ways that a browser-based chatbot never could, because it&#8217;s not a visitor&#8212;it&#8217;s part of the house.</p><p>Both companies are building the same architecture: small, capable models embedded in the OS that can handle most tasks locally, routing to larger cloud models only when necessary. The operating system decides where computation happens&#8212;local chip, cloud server, hybrid&#8212;just like TCP/IP decides how packets get routed. Apps don&#8217;t need to think about it. They just call the API.</p><p>This unlocks something new: automatic behavior.</p><p>Right now, cloud-based AI features are almost always click-gated. You open ChatGPT. You ask a question. You wait for a response. Why? Because running inference in the cloud costs money. Why run expensive computation if the user might not use it?</p><p>But when the model runs locally on your device, the marginal cost per inference drops to nearly zero. Suddenly, your OS can do things without the user initiating.</p><p>Your computer could be constantly working on your behalf using AI, the way it constantly works on your behalf using networking.</p><p>And it can do this because your context is already there&#8212;your files, your data, everything your computer knows about you is local. There&#8217;s no round trip to a cloud service. No data leaving your machine. Just local intelligence working with local information.</p><p>Apps can assume AI exists the way they assume the file system exists, the way they assume networking exists.</p><p>And once apps can assume that, the effort to develop AI features disappears into the plumbing. Developers will build on whichever platform makes it easiest&#8212;whoever provides the simplest APIs, the fewest obstacles between an idea and a working feature.</p><h2>Everyone Is Racing to Be the Plumbing</h2><p>Whoever owns the plumbing layer becomes the gatekeeper. And gatekeeping is lucrative.</p><p>Apple&#8217;s App Store <a href="https://www.techloy.com/apple-made-10-billion-from-u-s-app-store-commissions-in-2024-now-its-fighting-to-keep-it/">earned the company $27.4 billion in commissions in 2024</a>&#8212;$10 billion from the U.S. alone.</p><p>If the next generation of applications are AI-enabled&#8212;and they will be&#8212;whoever controls the AI infrastructure controls which apps get built and where they&#8217;re distributed.</p><p>The economics are too large to ignore. This isn&#8217;t just about technical capability. It&#8217;s about defending and extending the most profitable layer of the stack.</p><p>Google sees this happening and has a problem. Chrome OS exists, but it runs on maybe 2% of the world&#8217;s computers&#8212;mostly in schools. They can&#8217;t own the operating system layer on the machines most people use for work.</p><p>But they don&#8217;t need to.</p><p>Chrome runs on <a href="https://gs.statcounter.com/browser-market-share">65% of all browsers worldwide</a>. And increasingly, the browser <em>is</em> the platform that matters. Your documents live in Google Docs, your design work happens in Figma, your spreadsheets run in Airtable. The operating system launches Chrome, and then Chrome becomes the environment where actual work happens.</p><p>So Google is building AI into Chrome itself. In December 2024, they <a href="https://developers.googleblog.com/on-device-genai-in-chrome-chromebook-plus-and-pixel-watch-with-litert-lm/">embedded Gemini Nano directly in the browser</a>&#8212;a small language model that runs locally, processing data without it ever leaving your machine. Any web application can call it. The browser becomes the AI layer, sitting between web apps and AI capabilities the same way Windows and macOS sit between native apps and AI capabilities.</p><p>The platform doesn&#8217;t have to be the operating system. It just has to be where developers build and where users spend their time. For Microsoft and Apple, that&#8217;s the OS. For Google, it&#8217;s one layer up.</p><h2>Building Infrastructure Is One Thing. Knowing How to Use It Is Another.</h2><p>In November 2024, Windows president Pavan Davuluri announced that Windows would &#8220;evolve into an agentic OS.&#8221; The response was thousands of overwhelmingly negative replies. But what does an &#8220;agentic OS&#8221; actually look like?</p><p>Microsoft&#8217;s answer seemed to be: <a href="https://www.windowscentral.com/software-apps/windows-11/microsoft-is-walking-back-windows-11s-ai-overload-scaling-down-copilot-and-rethinking-recall-in-a-major-shift">put a Copilot button everywhere</a>&#8212;File Explorer, Notepad, Paint, Settings. Every application got AI integration whether it made sense or not. Users weren&#8217;t ready for it.</p><p>Then there&#8217;s Recall&#8212;a feature that would screenshot everything you do and make it searchable with AI. As an idea, it&#8217;s interesting. As an implementation, the privacy concerns were immediate and loud. Microsoft postponed it by a year. Now they&#8217;re <a href="https://www.windowscentral.com/software-apps/windows-11/microsoft-is-walking-back-windows-11s-ai-overload-scaling-down-copilot-and-rethinking-recall-in-a-major-shift">backing off</a>: removing Copilot buttons from apps, rethinking Recall, pausing new integrations.</p><p>But the Windows Copilot Runtime&#8212;the infrastructure&#8212;that&#8217;s staying.</p><p>This is typical early-infrastructure behavior. When you build new plumbing, you don&#8217;t immediately know the right way to surface it. That gets co-created over time, through experimentation and iteration. Not every attempt works. That&#8217;s normal.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!Y6X3!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!Y6X3!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 424w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 848w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 1272w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!Y6X3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png" width="640" height="480" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/db64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:480,&quot;width&quot;:640,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;File:Windows 98 active desktop.png - Wikipedia&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="File:Windows 98 active desktop.png - Wikipedia" title="File:Windows 98 active desktop.png - Wikipedia" srcset="https://substackcdn.com/image/fetch/$s_!Y6X3!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 424w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 848w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 1272w, https://substackcdn.com/image/fetch/$s_!Y6X3!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fdb64b5d0-12e8-4b50-a7ec-8a10ce99b2bc_640x480.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Windows 98 did the same thing. The networking infrastructure was there, and Microsoft&#8217;s answer to &#8220;what should an internet-aware desktop look like?&#8221; was <a href="https://en.wikipedia.org/wiki/Active_Desktop">Active Desktop</a>. Your wallpaper could be a live web page. A toolbar of &#8220;Active Channels&#8221; delivered constantly updating content from Disney and Warner Bros. The desktop and the web were supposed to blur together.</p><p>Users hated it. Active Desktop was <a href="https://en.wikipedia.org/wiki/Active_Desktop">resource-heavy, unstable, and intrusive</a>. Most people didn&#8217;t have fast enough connections to make it useful. By Windows Me, Microsoft had quietly downplayed the feature.</p><p>But here&#8217;s what didn&#8217;t go away: the networking stack. TCP/IP stayed. Background updates stayed. Automatic syncing stayed. The plumbing remained; only the gaudy UX got stripped out.</p><p>That&#8217;s what&#8217;s happening now. Microsoft is pulling back Copilot buttons and reconsidering Recall, but the Windows Copilot Runtime&#8212;those 40+ models running in the background, the APIs that let any app access AI&#8212;that&#8217;s staying. The infrastructure is going in regardless of whether users like the first attempt at exposing it.</p><p>Because once the plumbing exists, you can iterate on the UX. You can try different approaches, see what users actually want, refine the experience. Active Desktop failed, but years later we got live tiles, widgets, and web-connected features that people actually used. The infrastructure made experimentation possible.</p><h2>When Infrastructure Becomes Invisible</h2><p>Here&#8217;s the thing about plumbing: once it&#8217;s built in, you can&#8217;t imagine the world without it.</p><p>We know the value of networking not because we think about it, but because we&#8217;ve stopped thinking about it. You only notice the internet when it&#8217;s gone&#8212;when you&#8217;re on a plane and that little Wi-Fi icon shows no connection. The infrastructure&#8217;s absence reveals what you were taking for granted.</p><p>That&#8217;s what&#8217;s coming with AI. Not a browser tab you open. Not a destination you visit. Just something your computer is, the way it&#8217;s always online.</p><p>We&#8217;re watching AI stop being something you do and start being something your computer is.</p><p></p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">If you found this useful, subscribe to get weekly articles about how AI is reshaping software, business, and the way we work..</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item><item><title><![CDATA[All In on the Cloud, All In on the Device]]></title><description><![CDATA[Why the companies spending $405 billion on cloud infrastructure are simultaneously betting on local AI]]></description><link>https://blog.boxcars.ai/p/all-in-on-the-cloud-all-in-on-the</link><guid isPermaLink="false">https://blog.boxcars.ai/p/all-in-on-the-cloud-all-in-on-the</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 29 Jan 2026 14:00:29 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4000" height="6000" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:6000,&quot;width&quot;:4000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;green plant on brown clay pot&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="green plant on brown clay pot" title="green plant on brown clay pot" srcset="https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1627347902083-edbcaa5c4286?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw0fHxib25zYWl8ZW58MHx8fHwxNzY5NjMxMzEwfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@s_tsuchiya">Se. Tsuchiya</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p></p><p>In January 2020, a team of researchers at OpenAI published a paper that would reshape the AI industry. The paper had an unassuming title&#8212;<a href="https://arxiv.org/abs/2001.08361">&#8220;Scaling Laws for Neural Language Models&#8221;</a>&#8212;but its findings were anything but modest. Jared Kaplan and his colleagues had discovered something that looked almost too good to be true: a formula.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!PCW_!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!PCW_!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 424w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 848w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!PCW_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg" width="1043" height="522" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:522,&quot;width&quot;:1043,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;1) Scaling Laws Kaplan et al. report that language models (LMs) performance  improves smoothly when increasing model size, dataset size, and compute.  Recent works provide empirical evidence that LMs are underexplored and&quot;,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="1) Scaling Laws Kaplan et al. report that language models (LMs) performance  improves smoothly when increasing model size, dataset size, and compute.  Recent works provide empirical evidence that LMs are underexplored and" title="1) Scaling Laws Kaplan et al. report that language models (LMs) performance  improves smoothly when increasing model size, dataset size, and compute.  Recent works provide empirical evidence that LMs are underexplored and" srcset="https://substackcdn.com/image/fetch/$s_!PCW_!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 424w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 848w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 1272w, https://substackcdn.com/image/fetch/$s_!PCW_!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F8c0bc4b0-ba71-4474-b657-236f1febd66b_1043x522.jpeg 1456w" sizes="100vw"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Scaling Laws</figcaption></figure></div><p>They found that the relationship between model size, training data, and performance wasn&#8217;t random or unpredictable&#8212;it followed clean mathematical curves. Double the parameters, and performance improved by a predictable amount. Add more training data, same result. Pour in more compute, watch the metrics climb. The curves held across seven orders of magnitude.</p><p>This observation became a roadmap.</p><p>Before this paper, building AI felt like alchemy&#8212;part science, part guesswork, with occasional breakthroughs. After it, the path forward seemed almost mechanical. You didn&#8217;t need a brilliant new algorithm. You didn&#8217;t need a conceptual breakthrough. You just needed to go bigger.</p><p>The paper arrived at exactly the right moment. Rich Sutton, one of the founding figures of reinforcement learning, had published an essay the year before called <a href="https://www.cs.utexas.edu/~eunsol/courses/data/bitter_lesson.pdf">&#8220;The Bitter Lesson.&#8221;</a> His argument was blunt: for seventy years, researchers had tried to build intelligence by encoding human knowledge into systems. They always failed. What actually worked? Throwing more compute at simpler methods. &#8220;The biggest lesson that can be read from 70 years of AI research,&#8221; Sutton wrote, &#8220;is that general methods that leverage computation are ultimately the most effective, and by a large margin.&#8221;</p><p>Kaplan&#8217;s scaling laws gave that lesson a formula. And the industry took notice.</p><p>What followed was the most dramatic expansion in AI history. GPT-2 had 1.5 billion parameters. GPT-3, released just five months after Kaplan&#8217;s paper, had 175 billion&#8212;over a hundred times larger&#8212;and GPT-4, released in 2023, reportedly exceeded a trillion. Each generation proved the formula worked: bigger models wrote better prose, solved harder problems, passed more exams.</p><p>If bigger always meant better, then the path to artificial general intelligence was simply a matter of scale. Build larger models. Train on more data. Construct bigger data centers.</p><p>And so the money started flowing. Not millions. Not billions. Hundreds of billions.</p><p>In 2025, <a href="https://io-fund.com/ai-stocks/ai-platforms/big-techs-405b-bet">the major tech companies spent over $405 billion on AI infrastructure.</a> Amazon alone invested $125 billion. Google, Microsoft, Meta&#8212;each poured tens of billions into facilities that draw gigawatts of power, enough to run small cities. The International Energy Agency projects that data center energy consumption will more than double by 2030, eventually exceeding the power demands of aluminum, steel, and cement production combined.</p><p>This is what conviction looks like. The industry went all in on a single thesis: scale is all you need.</p><p>But what if the formula is breaking down?</p><h2>The Scaling Wall</h2><p>In December 2025, Sara Hooker published a paper with a provocative title: <a href="https://papers.ssrn.com/sol3/papers.cfm?abstract_id=5877662">&#8220;On the Slow Death of Scaling.&#8221;</a> Hooker isn&#8217;t a contrarian blogger or an industry outsider. She led research at Cohere For AI before co-founding Adaption Labs. Her argument wasn&#8217;t that scaling had never worked&#8212;it was that its returns were collapsing.</p><p>&#8220;If you double compute size,&#8221; Hooker wrote, &#8220;you get... a measly two percentage points of performance.&#8221; The relationship between training compute and capability had become &#8220;uncertain and rapidly changing.&#8221; The easy gains were gone, and the clean curves from Kaplan&#8217;s paper were bending.</p><p>But she&#8217;s not alone. Ilya Sutskever, who co-founded OpenAI and led the research that created GPT, described a similar shift in a <a href="https://www.dwarkesh.com/p/ilya-sutskever-2">recent podcast interview</a>: &#8220;From 2020 to 2025, it was the age of scaling. People say, &#8216;This is amazing. You&#8217;ve got to scale more. Keep scaling.&#8217; The one word: scaling. But now the scale is so big... it&#8217;s back to the age of research again.&#8221;</p><p>The recipe that worked&#8212;mix compute with data in a neural net, scale it up&#8212;gave predictable results. Companies loved it. A low-risk way to invest billions. But Sutskever sees the end approaching: pre-training will run out of data, and what comes next might require different approaches, new algorithms, something beyond just making models bigger.</p><p>Not everyone agrees. Epoch AI, a research group focused on forecasting AI progress, published projections arguing that <a href="https://epoch.ai/blog/can-ai-scaling-continue-through-2030">scaling continues well past 2030</a>. They point to recent models that show continued improvements, and argue that synthetic data could solve the data bottleneck before it ever materializes.</p><p>So there&#8217;s genuine uncertainty about whether the infrastructure bet rests on a law that&#8217;s breaking or one that still holds. But <a href="https://blog.boxcars.ai/p/races-are-won-in-corners?utm_source=publication-search">nobody wants to let off the gas</a>&#8212;if scaling continues and you pulled back, you&#8217;ve ceded the future to your competitors. The cost of being wrong is existential.</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;d07361f5-a03a-4588-8c31-8ae2016681a5&quot;,&quot;caption&quot;:&quot;Formula 1 races are an incredible spectacle. Cars streak past at 200 miles per hour, their engines screaming, aerodynamics optimized to the millimeter. For hours, they follow each other around the track&#8212;jockeying for position, looking for opportunities, but mostly maintaining formation. The straight sections blur by. The&#8230;&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;sm&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Races Are Won in Corners&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2025-12-04T14:01:45.836Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/races-are-won-in-corners&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:180544124,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:0,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><h2>Small as the New Big</h2><p>While experts debate whether scaling will continue, something else is happening that changes the deployment economics entirely: small models are getting shockingly good.</p><p>Between November 2022 and October 2024, the cost of running a GPT-3.5-level model dropped 280-fold&#8212;from $20 per million tokens to $0.07&#8212;while <a href="https://hai.stanford.edu/ai-index/2025-ai-index-report">energy efficiency improved 40%</a> annually. And the performance gap between small and large models is closing fast.</p><p>Aya at 8 billion parameters beats BLOOM at 176 billion&#8212;4.5% of the size, better results&#8212;and Llama 3 at 8 billion competes with models twenty times larger. Not on every task. But on enough tasks to matter.</p><p>How is this possible?</p><p>When you train a large model, you end up with massive over-parameterization. The network creates millions of redundant weights&#8212;duplicates and correlations storing the same information in multiple ways. This redundancy is how the model learns, exploring different pathways to understanding.</p><p>But once training is complete, all that redundancy becomes dead weight. Through a process called distillation, you can compress the knowledge into a much smaller model&#8212;a large &#8220;teacher&#8221; training a smaller &#8220;student,&#8221; transferring intelligence to a leaner architecture. The student learns from the teacher&#8217;s full probability distributions, not just hard answers, preserving sophisticated reasoning in a fraction of the size.</p><p>This reveals something important: we need massive scale to discover intelligence, but we don&#8217;t need it to deploy what was discovered. The knowledge locked inside a trillion-parameter model, learned over months of compute, can be distilled into something that fits in your pocket.</p><p><a href="https://research.nvidia.com/labs/lpr/slm-agents/">Research from NVIDIA</a> shows that 40-60% of agent workloads&#8212;the everyday tasks people actually do&#8212;can be handled by specialized small models.</p><p>The industry was built around one assumption: if you need gigawatt data centers to train models, you need them to run models too. But what if training and deployment follow completely different curves&#8212;the breakthrough requiring massive scale, but delivery not requiring it at all?</p><h2>The Hedge</h2><p>The companies spending billions on gigawatt data centers are also quietly building for a world where those data centers matter less. They&#8217;re not choosing between scaling and small models. They&#8217;re betting on both.</p><p>When you have hundreds of billions in resources, you don&#8217;t pick sides&#8212;you ensure you win either way.</p><p>Start with Google. They built Gemini to compete with GPT-4 in the cloud, then released <a href="https://developers.googleblog.com/on-device-genai-in-chrome-chromebook-plus-and-pixel-watch-with-litert-lm/">Gemini Nano&#8212;a version that runs entirely on your phone</a>&#8212;and followed it with the <a href="https://blog.google/technology/developers/gemma-3/">Gemma family: models ranging from 1 billion to 27 billion parameters,</a> specifically designed for local hardware. The smallest version runs in Chrome itself, processing your data without it ever leaving your browser.</p><p>Microsoft spent $13 billion partnering with OpenAI and is pouring billions more into Azure infrastructure to dominate cloud AI. But they also built the <a href="https://azure.microsoft.com/en-us/blog/one-year-of-phi-small-language-models-making-big-leaps-in-ai/">Phi family&#8212;small models with 3.8 to 14 billion parameters</a> designed to run on laptops.</p><p>Apple went all-in on local from the start. Every Mac ships with unified memory architecture that turns your laptop&#8217;s RAM into AI memory&#8212;an M4 Max with 128GB runs 70-billion-parameter models that would normally require a server rack. The pitch is explicit: your data stays on your device, and the cloud only gets called for the hardest problems.</p><p>Then there&#8217;s the hardware mandate that almost nobody noticed. Microsoft&#8217;s Copilot+ PC specification requires every certified device to include a Neural Processing Unit&#8212;a chip dedicated to running AI locally. Google&#8217;s next generation of Chromebooks will require NPUs, and Apple already ships them in every device.</p><p>The entire PC industry is being quietly restructured around local AI.</p><p>And then there&#8217;s NVIDIA&#8212;the company worth over $3 trillion selling chips to data centers, whose H100 and H200 GPUs power the vast majority of AI training runs.</p><p>But NVIDIA is also building chips for your laptop. The N1 and N1X combine their Blackwell GPU architecture with ARM processors for local AI inference, and at CES they unveiled the <a href="https://www.nvidia.com/en-us/products/workstations/dgx-spark/">DGX Spark&#8212;a desktop computer that runs 200-billion-parameter models locally.</a> Lenovo is already preparing consumer laptops around these chips.</p><p>If local AI takes over, NVIDIA doesn&#8217;t lose&#8212;they become bigger than Intel ever was. Intel at its peak sold CPUs to every PC. NVIDIA could sell AI chips to every PC <em>and</em> every data center.</p><p>When you&#8217;re worth trillions, you don&#8217;t pick a side&#8212;you place chips on both sides of the table. If cloud AI dominates, you win. If local AI dominates, you win. No need to bet on just one outcome.</p><h2>What If the Ratio Is Different?</h2><p>Right now, the split between cloud and local AI is essentially 99 to 1. Nearly every AI interaction happens in a data center, and the only people running models locally are tinkerers who know how to install Ollama or run Llama.cpp from the command line.</p><p>But what happens when local AI is baked into every operating system?</p><p>When every Windows laptop ships with an NPU and Phi models built in. When every Chromebook has Gemini Nano running in the browser. When every Mac can run 70-billion-parameter models without connecting to the internet&#8212;and the default experience becomes local-first, with the cloud reserved for the hardest 10% of problems.</p><p>What does the ratio become then? 70-30? 50-50?</p><p>If inference shifts even partially local, the economics of the industry change. Training will still require massive scale&#8212;giant models, giant data centers&#8212;but the intelligence those facilities produce could end up running on the laptop in front of you.</p><p>The data centers don&#8217;t become useless. But maybe we don&#8217;t need as many gigawatt facilities as we&#8217;re building for. Maybe the future isn&#8217;t millions of people hitting cloud APIs billions of times a day. Maybe it&#8217;s millions of people running small local models that only reach out to the cloud when they&#8217;re genuinely stuck.</p><p>The companies placing the biggest bets seem to think this is plausible. They&#8217;re building for both futures because they can afford to. When you&#8217;re worth trillions, you don&#8217;t pick a side&#8212;you make sure you profit regardless of which world arrives.</p><p>And if you&#8217;ve been in tech long enough, this probably feels familiar.</p><p>Mainframes gave way to personal computers, which gave way to web apps on servers, which gave way to the cloud&#8212;and then mobile apps pulled computing back to the device. Now AI is starting in the cloud, and the pendulum is already swinging back toward local.</p><p>Thin client, thick client, thin client, thick client&#8212;the pattern never changes. The only difference this time is the scale of the bet, and the fact that the smart money isn&#8217;t choosing sides.</p><p>They&#8217;re betting on the pendulum itself.</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>The future of AI is being written in two places at once&#8212;massive data centers and the chip in your laptop. Subscribe to follow where both paths lead.</em>.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[Good Enough + Everywhere: Google's Bundling Playbook]]></title><description><![CDATA[Google is using Microsoft's 1995 strategy to catch OpenAI. But this time might be different.]]></description><link>https://blog.boxcars.ai/p/good-enough-everywhere-googles-bundling</link><guid isPermaLink="false">https://blog.boxcars.ai/p/good-enough-everywhere-googles-bundling</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 22 Jan 2026 14:00:55 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="14467" height="9744" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:9744,&quot;width&quot;:14467,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;logo&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="logo" title="logo" srcset="https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1662027067763-770376e710f5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxpbnRlcm5ldCUyMGV4cGxvcmVyfGVufDB8fHx8MTc2ODk5MjQxN3ww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@rubaitulazad">Rubaitul Azad</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>I canceled my Google One Pro subscription Saturday morning. By evening, I had resubscribed.</p><p>The reversal started when I looked at what I actually needed. I&#8217;m a perpetual AI tire-kicker&#8212;rotating through models the way some people sample streaming services, always chasing the next capability. I&#8217;d signed up for Google One Pro to access Gemini, tested it, and decided it was time to downgrade back to basic storage.</p><p>Then I did the math.</p><p>Two terabytes of cloud storage alone costs $9.99 a month. Google One bundles that same storage with Gemini for $19.99. ChatGPT Plus&#8212;costs $20 a month and includes no storage at all. For essentially the same price as ChatGPT alone, I could have both the storage I needed anyway and Google&#8217;s premium AI.</p><p>For the first time since ChatGPT launched, I found myself hovering over a different cancel button&#8212;the one for my OpenAI subscription.</p><p>That shift in thinking felt significant. Not because of my particular subscription choices, but because of what it revealed about how competition actually works in technology markets.</p><p>I&#8217;ve seen this pattern before. Thirty years ago, to be exact.</p><h2>August 9, 1995</h2><p>Trading on Netscape Communications stock was delayed for nearly two hours that morning. Order imbalances kept shares from hitting the NASDAQ floor&#8212;too much demand, not enough supply. When trading finally opened, the stock that had been priced at $28 the night before opened at $71.</p><p>By market close, <a href="https://www.internethistorypodcast.com/2015/08/20-years-on-why-netscapes-ipo-was-the-big-bang-of-the-internet-era/">Netscape was valued at $2.9 billion</a>. The company was sixteen months old. It had yet to make a dollar in profit. Marc Andreessen, the twenty-four-year-old co-founder, appeared barefoot on the cover of Time magazine. His stake was worth $59 million.</p><p>The IPO created a new vocabulary. Investors started talking about &#8220;Netscape moments&#8221;&#8212;high-visibility public offerings that signal the dawn of a new industry. Netscape Navigator had captured over 80% of the browser market. The internet was arriving, and Netscape owned the gateway.</p><p>At Microsoft&#8217;s headquarters in Redmond, Washington, Bill Gates was paying attention.</p><p>Three months earlier&#8212;May 26, 1995&#8212;Gates had <a href="https://www.cnbc.com/2020/05/26/how-bill-gates-described-the-internet-tidal-wave-in-1995.html">sent an internal memo</a> to Microsoft executives. The subject line read &#8220;The Internet Tidal Wave.&#8221;</p><p>&#8220;The Internet is a tidal wave,&#8221; Gates wrote. &#8220;It changes the rules. It is an incredible opportunity as well as [an] incredible challenge.&#8221;</p><p>He continued: &#8220;I have gone through several stages of increasing my views of [the internet&#8217;s] importance. Now I assign the internet the highest level of importance. The Internet is the most important single development to come along since the IBM PC was introduced in 1981. It is even more important than the arrival of the graphical user interface.&#8221;</p><p>The telling detail came from Gates&#8217; personal experience. After browsing the web for ten hours, he noted he &#8220;had not seen a single Word .DOC&#8221; or other Microsoft file formats. An entire digital world was emerging where Microsoft didn&#8217;t exist.</p><p>Netscape looked like the future. Microsoft looked late.</p><p>The question was whether Microsoft could catch up before Netscape turned its browser dominance into something larger&#8212;an entire platform for the emerging web. It was a race between innovation and distribution.</p><p>Twenty-seven years later, the same race would begin again.</p><h2>November 30, 2022</h2><p>ChatGPT reached one million users in five days. Instagram, the previous record holder, had taken seventy-five days to hit the same milestone. Within weeks, &#8220;ChatGPT&#8221; became synonymous with &#8220;AI&#8221; itself. The application threatened to unbundle search from Google&#8212;to do to Google what Netscape had threatened to do to Microsoft thirty years earlier.</p><p>At Google&#8217;s Mountain View headquarters, the response mirrored what had happened at Microsoft. <a href="https://ca.finance.yahoo.com/news/google-called-cofounders-larry-page-100007903.html">CEO Sundar Pichai issued a &#8220;code red&#8221;</a> in December 2022. He called Larry Page and Sergey Brin&#8212;the company&#8217;s co-founders who had stepped down more than three years earlier&#8212;back for emergency meetings.</p><p>Page and Brin attended several strategy sessions with executives, reviewed Google&#8217;s AI product roadmap, and approved plans to accelerate chatbot features in Search. Engineers worked through holidays. Sergey Brin, who hadn&#8217;t written code at Google in years, started programming again.</p><p>OpenAI&#8217;s valuation would eventually reach $500 billion. ChatGPT looked unstoppable.</p><p>Google looked late.</p><p>Both companies&#8212;Microsoft in 1995, Google in 2022&#8212;faced the same realization: an upstart was threatening their core business, and they might have already missed their window to respond.</p><p>The race was on. Could the incumbent gain innovation before the startup gained distribution?</p><h2>The First Stumble</h2><p>Microsoft&#8217;s initial response was underwhelming. Fifteen days after Netscape&#8217;s IPO, on August 24, 1995, Microsoft released Internet Explorer 1.0 as part of the Windows 95 Plus! add-on package. The reviews were brutal&#8212;Navigator commanded over 80% of the browser market and nobody took Microsoft&#8217;s entry seriously. Several months later came IE 1.5, which added basic table rendering and remained hopelessly behind Netscape&#8217;s capabilities.</p><p>Microsoft looked outmatched. But at least they&#8217;d avoided public humiliation.</p><p>Google&#8217;s first attempt went worse.</p><p>On February 8, 2023&#8212;just over two months after the code red&#8212;<a href="https://www.cnn.com/2023/02/08/tech/google-ai-bard-demo-error">Google demonstrated Bard to the public</a>. The company had rushed the chatbot to market, and it showed. In the promotional materials, Bard confidently claimed that the James Webb Space Telescope &#8220;took the very first pictures of a planet outside of our own solar system.&#8221;</p><p>Astronomers noticed immediately. NASA&#8217;s records showed the European Southern Observatory&#8217;s Very Large Telescope had captured the first exoplanet image in 2004&#8212;nearly two decades before JWST launched. The error wasn&#8217;t subtle ambiguity or a matter of interpretation. It was simply, publicly, demonstrably wrong.</p><p>The market&#8217;s response was swift. The next day, <a href="https://www.npr.org/2023/02/09/1155650909/google-chatbot--error-bard-shares">Alphabet&#8217;s market value dropped $100 billion</a>&#8212;roughly the entire market capitalization of Ford, Delta, and American Airlines combined, vaporized in a single trading session. Reports surfaced that senior leadership had overruled risk assessments to rush Bard out the door, sacrificing accuracy for speed.</p><p>Both Microsoft and Google had stumbled. Both looked vulnerable. Both appeared to have confirmed the conventional wisdom: they&#8217;d missed their window. The pattern seemed clear&#8212;upstart innovation beats incumbent bureaucracy. Fast-moving startups disrupt slow-moving giants. Netscape would own browsers. OpenAI would own AI.</p><p>Except that&#8217;s not what happened.</p><p>It turned out the incumbents didn&#8217;t need to be better. They just needed to be good enough.</p><h2>Good Enough + Everywhere</h2><p>In August 1996, a year after Internet Explorer 1.0&#8217;s dismal debut, Microsoft released Internet Explorer 3.0. This version was different. It was <a href="https://www.xda-developers.com/microsoft-bundling-internet-explorer-windows-29-years/">bundled directly into Windows 95</a>&#8212;not as an add-on, but as an integral component of the operating system.</p><p>IE 3.0 supported Netscape&#8217;s plugin technology, added frames and JavaScript (though Microsoft called it &#8220;JScript&#8221;), and introduced Cascading Style Sheets. More importantly, it was free and already installed on every Windows PC.</p><p>A year later, in September 1997, Microsoft held a launch party in San Francisco for Internet Explorer 4.0, featuring a ten-foot-tall letter &#8220;e&#8221; logo. The next morning, Netscape employees found the giant &#8220;e&#8221; on their front lawn.</p><div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!sl9l!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!sl9l!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 424w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 848w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 1272w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!sl9l!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png" width="1139" height="673" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:673,&quot;width&quot;:1139,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:null,&quot;href&quot;:null,&quot;belowTheFold&quot;:true,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!sl9l!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 424w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 848w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 1272w, https://substackcdn.com/image/fetch/$s_!sl9l!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F075c2e6e-25f1-4e4c-8b01-ecf380466398_1139x673.png 1456w" sizes="100vw" loading="lazy"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption"><a href="https://medium.com/@ddprrt/tales-from-the-browser-wars-mozilla-stomps-internet-explorer-799035887cb1">The IE team drops off a large E in front of the Netscape HQ</a></figcaption></figure></div><p>Microsoft spent over $100 million per year on Internet Explorer and assigned over 1,000 people to the project. But the real power wasn&#8217;t in the development budget. As antitrust documents would later show, &#8220;Microsoft bound Internet Explorer to Windows with contractual and, later, technological shackles in order to ensure the prominent (and ultimately permanent) presence of Internet Explorer on every Windows user&#8217;s PC system.&#8221;</p><p>The strategy worked. IE&#8217;s market share climbed from less than 10% in 1996 to approximately 40% in 1998. By 2002, it would reach 95%.</p><p>Microsoft didn&#8217;t build the best browser. They built a good enough browser and made it inescapable.</p><h2>Every Surface</h2><p>Between 2024 and 2025, Google followed the same playbook&#8212;but they had far more surfaces to occupy than Microsoft ever did.</p><p>Microsoft had Windows and Office. Google had Android on billions of phones, Gmail handling the world&#8217;s email, Search answering billions of queries daily, Photos storing memories, Docs managing work, Maps guiding travel. Every Google product became a vector for Gemini.</p><p>The integration wasn&#8217;t subtle. Open your email, and Gemini offers to draft responses. Upload photos, and Gemini organizes them. Ask a question in Search, and Gemini answers before showing traditional results. The AI didn&#8217;t require installation or activation&#8212;it simply appeared wherever Google already lived.</p><p><a href="https://vertu.com/lifestyle/chatgpt-loses-market-dominance-as-google-gemini-surges/">About twice as many U.S. Android users</a> engage with Gemini through the operating system than through the standalone Gemini app. You don&#8217;t download anything or create a new account. Gemini is already there.</p><p>Then Google made the same move Microsoft had made with Internet Explorer: they made the bundle inescapable.</p><p>In February 2024, <a href="https://9to5google.com/2024/02/14/google-one-200gb-plan-hidden/">Google &#8220;hid&#8221; its 200GB storage-only plan</a> from the signup flow. The company&#8217;s Google One AI Premium plan&#8212;2TB storage plus Gemini Advanced for $19.99 a month&#8212;became the default option for users who needed cloud storage. You can&#8217;t add Gemini Advanced to a basic storage plan. If you want the AI features, you subscribe to the bundled plan.</p><p>The strategy created friction in the same way Microsoft had weaponized thirty years earlier. Internet Explorer came preinstalled on Windows. You could download Netscape, but that meant going somewhere else, finding the installer, running it. Most people never bothered.</p><p>ChatGPT requires the same extra effort&#8212;but with a twist that makes the friction even more effective.</p><p>In January 2026, <a href="https://blog.google/products/gemini/gemini-personalized-info/">Google emphasized</a> what Gemini could do with your personal information. The AI can analyze your Gmail to understand your interests, search your Docs to find relevant context, organize your Photos based on what matters to you. You still have to turn on the feature, but Google already has access to everything. Enabling Gemini with your personal data is just activating a feature within the ecosystem you already trust.</p><p>If you want ChatGPT to do the same, you need to explicitly grant OpenAI&#8212;a third-party company&#8212;access to your Gmail, your Drive, your Calendar. That&#8217;s not flipping a switch on a feature. That&#8217;s opening your private data to an outside company.</p><p>The permission moat might be more powerful than the distribution advantage. You could download Netscape despite Internet Explorer being preinstalled. But you can&#8217;t easily replicate the decade of email, documents, and photos you&#8217;ve entrusted to Google. The data itself becomes the lock-in.</p><p>Distribution solved the visibility problem. But bundling a mediocre product everywhere just gets you ignored everywhere. The real question was whether Google could turn distribution into improvement fast enough to matter.</p><h2>The Rearview Mirror</h2><p>Both Microsoft and Google kept shipping even when their products weren&#8217;t great. They took the criticism, the bad reviews, the $100 billion market cap drops. They kept putting software in front of users.</p><p>Distribution gave them something valuable: usage. Millions of people clicked on Internet Explorer because it was already there. Millions of people tried Gemini because it appeared in their Gmail. Each interaction generated data. Bug reports came back. Engineers fixed problems. The products improved.</p><p>Microsoft&#8217;s market share climbed from less than 10% in 1996 to 40% in 1998. By August 1996, IE 3.0 had achieved feature parity with Netscape. A year later, IE 4.0 was actually better&#8212;faster, more standards-compliant, and more stable than the increasingly buggy Netscape Navigator 4.0.</p><p>The same pattern repeated thirty years later. <a href="https://9to5google.com/2025/10/29/gemini-app-650-million-users/">Between October 2024 and November 2025, Gemini grew from 90 million to 650 million users</a>&#8212;sevenfold in twelve months. ChatGPT grew from 200 million to 810 million in the same period&#8212;still leading, but the gap was closing. Market share told the story more clearly: <a href="https://vertu.com/lifestyle/ai-chatbot-market-share-2026-chatgpt-drops-to-68-as-google-gemini-surges-to-18-2/">ChatGPT&#8217;s dominance dropped from 87.2% to 68%</a>; Gemini climbed from 5.4% to 18.2%.</p><p>Then, on November 18, 2025, Google released Gemini 3. The model topped ChatGPT on major benchmarks. In January 2026, <a href="https://felloai.com/best-ai-of-january-2026/">Gemini 3 Pro achieved a 1501 Elo score</a> on user preference rankings&#8212;the first model to cross the 1500 threshold.</p><p>Two weeks later, <a href="https://fortune.com/2025/12/17/sam-altman-chatgpt-openai-versus-google-gemini-code-red-strategy/">Sam Altman sent an internal memo to OpenAI staff</a>: &#8220;Code Red.&#8221; The company&#8217;s highest priority level. Teams working on advertising, health agents, shopping assistants were reassigned within hours. Daily war room calls. An eight-week sprint to improve ChatGPT&#8217;s quality and speed.</p><p>Exactly three years after Sundar Pichai&#8217;s code red over ChatGPT, Sam Altman was declaring code red over Gemini.</p><p>The market noticed. The day after Gemini 3 launched, <a href="https://www.financialexpress.com/market/googles-gemini-3-launch-sparks-3-stock-surge-as-investors-flock-to-ai-leader-3684914/">Google&#8217;s stock jumped 3%</a>. By January 2026, the company briefly <a href="https://finance.yahoo.com/news/alphabet-overtakes-apple-second-most-185629186.html">overtook Apple as the second-most valuable company</a>, crossing $4 trillion in market cap for the first time. Google&#8217;s stock had gained 65% in 2025&#8212;its sharpest rally since 2009.</p><p>Internet Explorer took about two years to go from &#8220;good enough&#8221; to competitive with Netscape. Gemini did it in three years.</p><p>The playbook had worked.</p><h2>But This Time Might Be Different</h2><p>The bundling playbook worked for Microsoft. Netscape&#8217;s market share collapsed. By 1998, they open-sourced Navigator. AOL acquired what remained for $4.2 billion&#8212;a tenth of their peak valuation.</p><p>But OpenAI isn&#8217;t Netscape.</p><p>Unlike Netscape, which faced Microsoft alone, OpenAI has its own bundler. Microsoft embedded ChatGPT into Windows, Office 365, and GitHub. They paid $13 billion to ensure OpenAI wouldn&#8217;t be fighting distribution with innovation alone. This isn&#8217;t purely incumbent versus upstart.</p><p>And the technology itself hasn&#8217;t stabilized. In the browser wars, &#8220;good enough&#8221; meant rendering HTML and running JavaScript. Once IE reached parity in 1996, the bar stayed relatively fixed. AI capabilities are evolving monthly&#8212;reasoning, agents, multimodal understanding. Gemini crossed the 1500 Elo threshold in January 2026. Six months from now, that might be table stakes. Bundling works when &#8220;good enough&#8221; stays good enough. Can it work when the ceiling keeps rising?</p><p>The AI market might also support what the browser market couldn&#8217;t: multiple winners playing different games. I currently have three AI subscriptions&#8212;Google, ChatGPT, and Claude. Browsers were winner-take-all; you used one at a time. AI tools are serving different needs. Anthropic isn&#8217;t trying to be everywhere&#8212;they&#8217;re building tools developers love and letting those developers bring Claude to enterprises. That&#8217;s a different game than consumer bundling.</p><p>History rhymes, but the variables are different. We&#8217;re watching the bundling playbook execute in real-time. Google has deployed it successfully. But this time the startup has distribution, the technology is still accelerating, and the market structure might allow for specialization.</p><p>For now, I still have all three subscriptions. History hasn&#8217;t finished rhyming yet.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">This pattern repeats every decade. Subscribe to catch the next one before it catches you.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p>Related:</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;8e9d95b8-482f-414d-94a3-c8b9ab6fb05e&quot;,&quot;caption&quot;:&quot;In February 2023, Microsoft CEO Satya Nadella threw down the gauntlet. Fresh from a $10 billion investment in OpenAI, he challenged the tech world's most entrenched player - Google.&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;lg&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Pondering the Future of Search: Why Google Will Win (Part 1)&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2024-11-07T14:00:54.321Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1675352161828-c07170f1b114?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMHx8Z29vZ2xlJTIwc2VhcmNofGVufDB8fHx8MTczMDkzNDEyN3ww&amp;ixlib=rb-4.0.3&amp;q=80&amp;w=1080&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/pondering-the-future-of-search-why&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:151298452,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div>]]></content:encoded></item><item><title><![CDATA[The Self-Improving Kludge: Can AI Learn to Learn?]]></title><description><![CDATA[How AI models are closing the self-improvement loop awkwardly&#8212;and why that might be enough]]></description><link>https://blog.boxcars.ai/p/the-self-improving-kludge-can-ai</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-self-improving-kludge-can-ai</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 15 Jan 2026 14:03:16 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="3335" height="2500" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2500,&quot;width&quot;:3335,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;brown rope on blue textile&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="brown rope on blue textile" title="brown rope on blue textile" srcset="https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1621713222995-29a358588512?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw1fHxsb29wfGVufDB8fHx8MTc2ODMyNTY0MXww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@kierinsightarchives">Kier in Sight Archives</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>&#8220;Why doesn&#8217;t it learn?&#8221;</p><p>The question comes up every time I explain how large language models work. Someone will say: &#8220;I corrected ChatGPT on something yesterday. It apologized, said it understood, even thanked me. But today it made the exact same mistake. What&#8217;s wrong with it?&#8221;</p><p>Nothing is wrong with it. It&#8217;s limited by how large language models work.</p><p>Large language models operate in two distinct phases. Phase one is training&#8212;where the model learns from billions of text examples, adjusting millions of configuration parameters (called &#8220;weights&#8221;) until it can predict patterns in language. This phase takes weeks of compute time and costs millions of dollars. Then training stops. The weights freeze.</p><p>Phase two is inference&#8212;using the trained model to answer questions. This is what you interact with when you use ChatGPT. But here&#8217;s the critical limitation: during inference, the model cannot learn. The weights stay frozen. Every conversation starts from the exact same snapshot taken when training ended.</p><p>When you talk to ChatGPT, you&#8217;re talking to a photograph, not a person.</p><p>You might be thinking: &#8220;But ChatGPT has memory features. It remembers things about me across conversations.&#8221; True. But that&#8217;s not learning&#8212;it&#8217;s a context engineering workaround. The system stores notes about you separately and includes them in future prompts. It&#8217;s like taping a sticky note to that photograph. The photograph itself hasn&#8217;t changed. The weights are still frozen. All the &#8220;memory&#8221; features, retrieval systems, and context tricks we use today are workarounds that give the illusion of learning.</p><p>To improve the model&#8212;to actually make it learn from all those corrections users give it&#8212;you have to go back to phase one. Human researchers must collect the feedback, decide what it means, create new training data, and retrain the system from scratch. It&#8217;s slow, expensive, and limited by human speed and judgment. The model isn&#8217;t improving itself. Humans are improving it, one training cycle at a time.</p><p>This is why many researchers argue that LLMs hit a fundamental ceiling. No matter how impressive they get, there&#8217;s a natural limit to how useful they can become if they can&#8217;t learn continuously.</p><p>Popular AI podcaster <a href="https://www.dwarkesh.com/p/timelines-june-2025">Dwarkesh Patel argues</a> that &#8220;the lack of continual learning is a huge huge problem&#8221; and that while LLMs might have higher baseline performance, &#8220;there&#8217;s no way to give a model high-level feedback, and you&#8217;re stuck with the abilities you get out of the box.&#8221; <a href="https://www.dwarkesh.com/p/richard-sutton">Richard Sutton</a>, widely considered the father of reinforcement learning, goes further: LLMs aren&#8217;t capable of learning on-the-job, so &#8220;no matter how much we scale, we&#8217;ll need some new architecture to enable continual learning.&#8221;</p><p>The skeptics point to a stark contrast. Consider <a href="https://deepmind.google/discover/blog/alphago-zero-starting-from-scratch/">AlphaGo</a>, DeepMind&#8217;s system that learned to defeat world champion Go players. It didn&#8217;t need humans to improve it. AlphaGo played against itself millions of times, getting immediate, objective feedback with every game: win or loss. Each game taught it which strategies worked. The self-improvement loop was closed. No human bottleneck.</p><p>Why can&#8217;t we use the same approach for language models? Because Go is a closed game with clear rules and an objective win condition. There&#8217;s no ambiguity about whether a move was good or bad&#8212;the game tells you. But there&#8217;s no objective function for &#8220;good conversation&#8221; or &#8220;useful help.&#8221; Language is open-ended, context-dependent, and fundamentally subjective.</p><p>So when ChatGPT generates a response, what feedback does it get? You might use it, ignore it, love it, hate it. From the model&#8217;s perspective: nothing. No score. No signal. Just silence. To get better, humans must step in&#8212;collecting feedback, judging quality, creating new training data, retraining the entire system. Slow. Expensive. Limited by human availability.</p><p>If the humans are doing all the improving work, is the system really intelligent? Or are we just building very expensive tools that appear to be intelligent?</p><p>The human bottleneck can&#8217;t be removed. That&#8217;s the argument. And it&#8217;s a convincing one.</p><p>But recently, a paper from researchers at the University of T&#252;bingen caught my eye&#8212;because it suggests a kludgy workaround.</p><h2>AI Training AI: The Awkward Workaround</h2><p>The individual LLM can&#8217;t learn. That architecture is fundamentally frozen. But what if you zoom out? What if you put that frozen LLM inside a larger system&#8212;and use <em>another</em> AI to play the role of the human researcher?</p><p>The LLM itself stays frozen. But the macro system could become self-improving. One AI trains the other AI, which trains the next version of the first AI. The loop closes, even if it closes awkwardly.</p><p>This is what <a href="https://posttrainbench.com/">PostTrainBench</a> tests: whether AI models can do the work that human AI researchers currently do&#8212;collecting data, selecting training parameters, running experiments, evaluating results.</p><p>The setup was straightforward: give a model (let&#8217;s call it the &#8220;researcher AI&#8221;) a base model to improve, access to an H100 GPU, ten hours, and the standard tools human researchers use. The task? Do what AI researchers do every day: curate training datasets, select hyperparameters, run training loops, evaluate results, iterate. All the human bottleneck work.</p><p>The models achieved 20-30% of what human experts manage. Not impressive. Humans still hit around 60% effectiveness on these benchmarks.</p><p>But here&#8217;s what made me pause: they did it at all.</p><p>Think about what&#8217;s happening here. The researcher AI is mimicking what human researchers do&#8212;because that&#8217;s what it learned from watching humans during its own training. It&#8217;s not truly intelligent research. It&#8217;s pattern-matching on &#8220;what would a human researcher try next?&#8221; The models even discovered the same heuristic human researchers use: dataset quality matters more than training duration. Not because they understand why, but because they saw that pattern in their training data.</p><p>And the researcher AI has to judge whether the newly trained model is &#8220;better.&#8221; But where did it learn what &#8220;better&#8221; means? From humans, through RLHF during its own training. It&#8217;s a copy judging based on what it learned from the original. Like asking someone to grade their own test based on what they think the teacher wants.</p><p>This isn&#8217;t real self-improvement. It&#8217;s mimicking self-improvement. The macro system looks like it&#8217;s learning, but it&#8217;s really just running on patterns absorbed from humans. After all, someone had to train that researcher AI in the first place.</p><p>And yet: it&#8217;s working. Sort of. Twenty to thirty percent effectiveness is nothing to celebrate, but it&#8217;s enough to wonder: what if awkward mimicry is good enough?</p><h2>When the Loop Closes</h2><p>Here&#8217;s the thing about mimicry: if it&#8217;s good enough to close the loop, it doesn&#8217;t matter that it&#8217;s not &#8220;true&#8221; self-improvement.</p><p>Right now, every AI improvement cycle requires human researchers.</p><p>But even at 20-30% effectiveness, if AI can do that work, the dynamics shift. The arithmetic is straightforward: run a thousand AI researchers in parallel. They work 24/7 without fatigue. They test variations at scales humans can&#8217;t match. The mimicry doesn&#8217;t need to be good&#8212;it needs to be good enough to remove the bottleneck, cheap enough to run at scale, and fast enough to iterate quickly.</p><p>This is what people mean when they talk about AI takeoff scenarios. Once AI can improve AI&#8212;even awkwardly, even through mimicry&#8212;the pace accelerates. The human bottleneck disappears. Each generation of models can help train the next generation faster than humans could alone.</p><p>And this isn&#8217;t theoretical speculation. <a href="https://www.technologyreview.com/2026/01/05/1130662/whats-next-for-ai-in-2026/">Google&#8217;s Gemini Pro reasoning model helped speed up training of Gemini Pro itself</a>. OpenAI and Anthropic are almost certainly experimenting with similar approaches. The self-improvement loop is starting to close, even if it&#8217;s closing through kludgy mimicry rather than elegant architecture.</p><p>First-mover advantage starts to matter more than theoretical purity.</p><p>But can a kludge really be the path to dominance? History suggests: absolutely.</p><h2>The Kludge That Wins</h2><p>In the race between kludgy-but-exists and well-designed-but-theoretical, bet on the kludge every time.</p><p>Imagine you&#8217;re designing a bipedal organism from scratch. You wouldn&#8217;t design human knees. They&#8217;re structurally backward&#8212;evolved from quadruped knees that spent most of their time on all fours, now forced to bear full body weight in an upright position. <a href="https://news.harvard.edu/gazette/story/2020/04/human-knee-evolved-in-lockstep-with-osteoarthritis-harvard-study-says/">Arthritis has plagued hominids since we became bipedal</a>. Our knees hurt. Our backs ache. It&#8217;s a kludge.</p><p>But nature already had chimpanzees. And evolution kludged those quadruped bodies into bipedal humans&#8212;freeing up our hands for tools, allowing us to build and use technology, enabling us to dominate the ecosystem. Not optimal. But, good enough to win.</p><p>Or consider the giraffe&#8217;s recurrent laryngeal nerve&#8212;fifteen feet long when it could be six inches, running from the brain down into the chest, looping around the aorta, back up to the larynx. Made perfect sense in fish ancestors. Makes no sense in giraffes. But evolution extends what&#8217;s already there rather than redesigning from scratch. Terrible design. Works fine. Result: giraffes exist.</p><p>The pattern is clear: optimization happens within constraints. &#8220;Good enough&#8221; beats &#8220;perfect&#8221; if it arrives first.</p><p>Technology follows the same pattern. Your keyboard is almost certainly QWERTY&#8212;<a href="https://www.smithsonianmag.com/history/the-qwerty-keyboard-will-never-die-where-did-the-150-year-old-design-come-from-49863249/">designed in 1868 to slow typists down</a> so mechanical typewriters wouldn&#8217;t jam. Typewriters haven&#8217;t existed for decades. More efficient layouts exist. We know QWERTY is suboptimal. But <a href="https://searsol.com/why-has-the-qwerty-keyboard-survived-compared-to-more-easier-input-keyboard-layouts/">when computers came along, everyone already knew QWERTY</a>. Switching costs too high. Result: we type on a 156-year-old hack.</p><p>Once a kludge achieves dominance, ecosystem builds around it. Tools, expertise, infrastructure. Switching costs become prohibitive. Incremental improvements patch the worst problems. We never find out if the &#8220;better&#8221; solution would have been better. The kludge becomes the standard.</p><p>Applied to AI: even if a &#8220;proper learning architecture&#8221; exists somewhere, even if it would be theoretically superior, LLMs plus kludgy self-improvement might get there first. Massive investment already exists&#8212;trained researchers, optimized hardware, entire ecosystems. Once you have a working system, even a kludgy one, you don&#8217;t rebuild from scratch.</p><h2>Good Enough to Win</h2><p>The skeptics are right. LLMs fundamentally can&#8217;t learn. PostTrainBench&#8217;s workaround is circular&#8212;AI mimicking humans who trained the AI in the first place. Twenty to thirty percent effectiveness. Awkward, indirect, and might not scale.</p><p>But here&#8217;s what matters: LLMs don&#8217;t have to truly learn. The macro system just has to be good enough to close the loop. And history suggests that &#8220;good enough and here now&#8221; beats &#8220;theoretically perfect but not here yet.&#8221;</p><p>After all, we conquered the planet on knees that swell and ache. We type on keyboards designed for mechanical problems that vanished decades ago. First-mover advantage, not elegant design.</p><p>The question isn&#8217;t whether the path is elegant&#8212;it&#8217;s whether it&#8217;s good enough to get there first.</p><p>And right now, the kludge is in the lead.</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>AI is evolving faster than anyone expected&#8212;and not always in elegant ways. Subscribe for weekly insights into how AI actually develops, and what it means for the rest of us.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p><em>See Also</em></p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;0ce38963-ffb9-4bf6-af57-d335a11231a4&quot;,&quot;caption&quot;:&quot;In his book &#8220;Kluge: The Haphazard Construction of the Human Mind,&#8221; Gary Marcus details how our brains have been shaped by evolution into a structure that is functional but imperfect. According to Marcus, the human brain is a &#8220;kluge,&#8221; a clumsy or inelegant - yet surprisingly effective - solution to the problem of guiding a human body.&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;lg&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Kluges That Work: Turning Pattern Matchers into Logical Reasoners&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2023-06-22T13:10:04.677Z&quot;,&quot;cover_image&quot;:&quot;https://substackcdn.com/image/fetch/$s_!sSxe!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F71eb49ce-89b5-44e8-800a-9338e70c0777_1598x548.png&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/kluges-that-work-turning-pattern&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:130188538,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:2,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div>]]></content:encoded></item><item><title><![CDATA[Software That Sees Before It Asks]]></title><description><![CDATA[How software becomes bespoke when interfaces materialize from data]]></description><link>https://blog.boxcars.ai/p/software-that-sees-before-it-asks</link><guid isPermaLink="false">https://blog.boxcars.ai/p/software-that-sees-before-it-asks</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 08 Jan 2026 14:03:06 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="6048" height="4024" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:4024,&quot;width&quot;:6048,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;a close up of a coin operated parking meter&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="a close up of a coin operated parking meter" title="a close up of a coin operated parking meter" srcset="https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1702905260008-03573d21dae5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw4N3x8Ymlub2N1bGFyc3xlbnwwfHx8fDE3Njc4NDk4NjN8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@benwhitephotography">Ben White</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>I&#8217;ve been building software for over two decades. The process always follows the same pattern: design the interface, ship it, then users bring their data.</p><p>This sequence&#8212;interface first, data second&#8212;is why most software serves everyone adequately but no one perfectly. You build one form for thousands of users with thousands of different situations. Product managers make decisions: we&#8217;ll ask these questions in this order, offer these options, support these common scenarios. Users arrive and squeeze their specific context into pre-built categories.</p><p>What if that could invert? What if the data came first, and the interface materialized around it?</p><h2>How We Build Software Today</h2><p>Take landscape design software, for example. You want to help homeowners design their own yards, so you study how landscape architects work&#8212;the questions they ask, the factors they consider, the sequence of their analysis. Then you build it into forms.</p><p>But you&#8217;re designing for thousands of users with thousands of different yards. The product manager makes decisions: we&#8217;ll ask about trees first, then budget, then design preferences. We&#8217;ll offer these five style templates. We&#8217;ll support these common scenarios.</p><p>The form launches. A user opens it.</p><p><strong>Question 1:</strong> &#8220;How many trees are in your yard?&#8221;</p><ul><li><p>Dropdown: None, 1-2, 3-5, 5+</p></li></ul><p>She has one tree. But it&#8217;s a massive oak that&#8217;s been there for forty years. It dominates the entire yard&#8212;provides afternoon shade to the patio, drops acorns in the fall, has roots that spread thirty feet. Is that &#8220;1-2 trees&#8221;? Technically yes, but the dropdown doesn&#8217;t capture what matters.</p><p>She selects &#8220;1-2&#8221; and continues.</p><p><strong>Question 2:</strong> &#8220;What is your primary goal for this project?&#8221;</p><ul><li><p>Radio buttons: Aesthetics, Low Maintenance, Privacy, Entertaining, Increase Property Value</p></li></ul><p>She wants to build a deck for entertaining. But she also wants it designed around that oak tree&#8212;she loves the shade it provides. The tree isn&#8217;t just a variable, it&#8217;s the centerpiece. There&#8217;s no option for &#8220;build around existing tree.&#8221;</p><p>She selects &#8220;Entertaining&#8221; and continues, wondering if the software understands what she&#8217;s actually trying to do.</p><p><strong>Question 3:</strong> &#8220;Preferred deck material?&#8221;</p><ul><li><p>Dropdown: Wood, Composite, PVC</p></li></ul><p>She&#8217;s not sure. Wood might look better, but the oak drops leaves and acorns. Does that matter? The form doesn&#8217;t ask about what&#8217;s <em>above</em> the deck, only what it&#8217;s made of.</p><p>She picks &#8220;Wood&#8221; and submits.</p><p>The software generates recommendations. A deck design for entertaining. Some notes about tree placement&#8212;generic advice about maintaining clearance from trunks. The output is reasonable. Workable, even. But it&#8217;s designed for someone with &#8220;1-2 trees&#8221; who wants &#8220;Entertaining,&#8221; not for someone with a forty-year-old oak tree they want to make the centerpiece of their outdoor living space.</p><p>The complexity the software couldn&#8217;t capture became work she had to do&#8212;translating her specific oak tree into &#8220;1-2 trees,&#8221; her nuanced goals into &#8220;Entertaining,&#8221; her material decision into a blind choice without context.</p><h2>When the Software Sees First</h2><p>Now imagine a different flow.</p><p>You open the landscape software. The first screen asks you to upload a photo of your yard.</p><p>You take a photo from your back door&#8212;the oak tree is prominent, the patio visible beneath it, the lawn spreading out beyond.</p><p>You upload it.</p><p>A few seconds pass. Then the interface materializes.</p><p><strong>The software generates a form, specific to what it sees:</strong></p><p>&#8220;I see a mature oak tree&#8212;looks like a Valley Oak, probably 40+ years old based on the canopy spread. That&#8217;s a beautiful centerpiece. Are you looking to design around it, or would you consider other layouts?&#8221;</p><ul><li><p>Radio buttons: Design around the tree / Open to alternatives / Not sure yet</p></li></ul><p>&#8220;I notice the tree provides afternoon shade to your patio area. Would you want a deck in that shaded zone, or are you thinking a different location?&#8221;</p><ul><li><p>Clickable image map of your yard with zones marked</p></li></ul><p>&#8220;Given the oak&#8217;s canopy, you&#8217;ll get significant leaf drop in fall. For a deck in that location, I&#8217;d typically recommend composite or PVC over wood for lower maintenance. Does that align with your preferences?&#8221;</p><ul><li><p>Radio buttons: Composite (recommended), PVC, Wood (requires more maintenance), Show me trade-offs</p></li></ul><p>The software isn&#8217;t asking generic questions hoping they&#8217;ll apply to your situation. It&#8217;s asking specific questions about <em>your</em> oak tree, <em>your</em> patio, <em>your</em> shade patterns. The form materialized from understanding your yard first.</p><p>The data came first. The interface came second.</p><h2>When AI Learned to Speak UI</h2><p>This wasn&#8217;t possible before GenAI.</p><p>Software had to be designed, built, and shipped before users arrived. You could customize experiences based on data&#8212;Google Search shows you local weather, Amazon recommends products based on your browsing&#8212;but those customizations were pre-programmed. Google couldn&#8217;t look at your upcoming travel booking and generate a new weather interface showing your destination&#8217;s forecast with a packing checklist based on the climate. The panels were pre-built. The logic was pre-defined. You couldn&#8217;t generate interfaces on the fly because nothing could reason about data and decide what UI components made sense in the moment.</p><p>When AI first arrived, it only spoke text. You could have conversations, get explanations, even generate images&#8212;but all through text commands. &#8220;Make it brighter.&#8221; How much brighter? You wanted a slider. &#8220;Add more contrast to the left side.&#8221; Which part of the left side? You wanted to click and drag. Text forces you to describe what you want to point at. The gap between AI&#8217;s understanding and your ability to act on it was the missing interface layer.</p><p>AI needed to speak UI.</p><p><a href="https://medium.com/design-bootcamp/ai-is-making-us-rethink-ux-dc9040746d1c">In 2023, I wrote about how AI would make us rethink UX</a>. The tension was clear: AI could understand context in ways pre-built software never could, but if it could only respond in text, it was stuck explaining rather than enabling. The insight was that interfaces wouldn&#8217;t need to be pre-built navigation flows. They could materialize based on what users needed, when they needed it. But the tools to build this didn&#8217;t exist yet.</p><p>That&#8217;s changing now.</p><p>Over the past few months, infrastructure has emerged that lets AI generate interface elements, not just text. <a href="https://developers.googleblog.com/introducing-a2ui-an-open-project-for-agent-driven-interfaces/">Google released A2UI</a> in December 2025&#8212;an open-source framework that lets AI agents compose interfaces from trusted component catalogs, with the same payload rendering across Flutter, web, and native platforms. <a href="https://github.com/CopilotKit/CopilotKit/tree/main/examples/coagents-agui">CopilotKit introduced AG-UI</a>, a protocol for keeping agents and interfaces synchronized in real-time. <a href="https://blog.modelcontextprotocol.io/posts/2025-11-21-mcp-apps/">Anthropic and OpenAI collaborated on the MCP Apps extension</a> in November 2025, bringing standardized interactive UI capabilities to Model Context Protocol&#8212;letting MCP servers present visual information and collect complex user input through sandboxed interfaces.</p><p>These are early approaches to a problem everyone&#8217;s trying to solve. The patterns are still being worked out, the standards still taking shape. But the direction is clear: AI needs to speak in interface components, not just text.</p><p>The landscape software example isn&#8217;t hypothetical anymore. <a href="https://www.youtube.com/watch?v=ZMIAlxx-Jx4">A2UI&#8217;s demos</a> include exactly this&#8212;a landscape architect application where users upload photos, and Gemini generates custom forms specific to what it sees in the yard. The interface materializes from the data.</p><div id="youtube2-ZMIAlxx-Jx4" class="youtube-wrap" data-attrs="{&quot;videoId&quot;:&quot;ZMIAlxx-Jx4&quot;,&quot;startTime&quot;:null,&quot;endTime&quot;:null}" data-component-name="Youtube2ToDOM"><div class="youtube-inner"><iframe src="https://www.youtube-nocookie.com/embed/ZMIAlxx-Jx4?rel=0&amp;autoplay=0&amp;showinfo=0&amp;enablejsapi=0" frameborder="0" loading="lazy" gesture="media" allow="autoplay; fullscreen" allowautoplay="true" allowfullscreen="true" width="728" height="409"></iframe></div></div><div><hr></div><h2>Software That Sees</h2><p>Now that AI can speak UI, we&#8217;re starting to see what becomes possible. But this raises questions we&#8217;re just beginning to answer.</p><p>When interfaces materialize from data rather than pre-built designs, how do we ensure they&#8217;re correct? What are the guardrails? A form asking about your oak tree feels personalized and helpful. But what if the AI misidentifies the tree species, or suggests a deck placement that&#8217;s structurally unsound, or generates interface elements that mislead rather than guide?</p><p>Pre-built software had clear accountability&#8212;the product manager who designed the form, the engineer who coded the logic, the QA team that tested the flows. When software generates interfaces on the fly, those lines blur. We&#8217;re figuring out how to maintain safety and reliability when the interface isn&#8217;t predetermined.</p><p>But here&#8217;s what&#8217;s exciting: we&#8217;re at the beginning of a new way to design, build, and ship software.</p><p>For two decades, I&#8217;ve watched product teams wrestle with the same constraint&#8212;design for scale, which means design for everyone, which means design for no one specifically. The homeowner with the forty-year-old oak got the same dropdowns as someone with a new subdivision lot. The software couldn&#8217;t see the difference.</p><p>That changes when AI can speak UI. The homeowner uploads a photo, and the software sees <em>her</em> oak tree, <em>her</em> patio, <em>her</em> afternoon shade patterns. The interface that materializes isn&#8217;t a garden path designed for thousands of users. It&#8217;s a conversation about her specific yard.</p><p>One-size-fits-all starts to fade. Bespoke software becomes possible at scale.</p><p>We have a lot to figure out&#8212;the guardrails, the accountability, the patterns that work and those that don&#8217;t. The infrastructure is early, the standards still taking shape. But the direction is set.</p><p>Software can finally see what it&#8217;s working with before deciding what to show you.</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Don&#8217;t miss the shift to bespoke software&#8212;subscribe for weekly insights on how AI is changing what we build.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item><item><title><![CDATA[The Unbreakable Pots]]></title><description><![CDATA[Why building the best AI model doesn&#8217;t guarantee capturing the most value]]></description><link>https://blog.boxcars.ai/p/the-unbreakable-pots</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-unbreakable-pots</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 11 Dec 2025 14:02:32 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="5184" height="3456" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3456,&quot;width&quot;:5184,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;a group of clay pots sitting next to each other&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="a group of clay pots sitting next to each other" title="a group of clay pots sitting next to each other" srcset="https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1649550387341-a5ba865236e3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwyMnx8cG90c3xlbnwwfHx8fDE3NjUxNzY3MjJ8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@jennys_eye0">Jen Dries</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>There&#8217;s an old Indian folktale about a potter who prayed for the skill to make unbreakable pots. The gods granted his wish. Business boomed initially&#8212;everyone wanted these perfect pots. Then sales slowed. The pots never broke, so nobody needed replacements. He hadn&#8217;t eliminated his business&#8212;he still made a living selling to new customers. But while his sales plateaued, someone else was making fortunes.</p><p>In June 2024, Anthropic released what looked like their unbreakable pot.</p><p>When Claude 3.5 Sonnet launched, developers couldn&#8217;t stop talking about it. The model <a href="https://www.anthropic.com/news/claude-3-5-sonnet">scored 64% on agentic coding tasks</a>, nearly doubling Claude 3 Opus&#8217;s 38%. Cursor, a new IDE, added support almost immediately. Social media filled with people building web apps and games through Claude&#8217;s interface&#8212;many without traditional coding experience.</p><p>One developer captured the moment: &#8220;Finally offering what everyone was waiting for&#8212;competent and correct automated code production.&#8221;</p><p>I&#8217;d been using Claude since Claude 2 launched in July 2023, first through the web interface, then through tools like Cline. But Claude 3.5 Sonnet felt different. The model actually worked. It produced code that ran. It understood context in ways previous models couldn&#8217;t.</p><p>Anthropic&#8217;s strategy seemed obvious: build the best coding model, charge premium prices, dominate the market. And for a while, it worked. <a href="https://the-decoder.com/anthropic-brings-bun-in-house-the-runtime-powering-claude-codes-1b-arr/">Claude Code hit $1 billion in revenue</a> just six months after launching in May 2025.</p><p>Then something started to shift. The gap that felt insurmountable began closing.</p><h2>When &#8220;Best&#8221; Stops Mattering</h2><p>By September 2025, <a href="https://www.cursor-ide.com/blog/gpt-51-vs-claude-45">Claude Sonnet 4.5 scored 77.2% on SWE-bench Verified</a>&#8212;still the highest score of any model available. Anthropic kept topping the benchmarks. The model remained technically superior.</p><p>But <a href="https://www.cursor-ide.com/blog/gpt-51-vs-claude-45">GPT-5 scored 74.9%</a> on the same benchmark. That 2.3 percentage point gap looked significant on paper. In actual use, I stopped noticing the difference. I started using OpenAI&#8217;s Codex more often. It was cheaper. And for most of what I was building, it worked just as well.</p><p>I wasn&#8217;t alone in noticing this compression. Simon Willison, a veteran developer who beta-tested Claude Opus 4.5, <a href="https://simonwillison.net/2025/Nov/24/claude-opus/">wrote something striking</a>. His preview access expired mid-project, forcing him to switch back to Claude Sonnet 4.5. He kept working at the same pace. &#8220;<em>I&#8217;m not saying the new model isn&#8217;t an improvement,</em>&#8220; he wrote, &#8220;<em>but I can&#8217;t say with confidence that the challenges I posed it were able to identify a meaningful difference in capabilities between the two.</em>&#8220;</p><p>Then he added the line that captures something important: &#8220;<em>This represents a growing problem for me. My favorite moments in AI are when a new model gives me the ability to do something that simply wasn&#8217;t possible before... but today it&#8217;s often very difficult to find concrete examples that differentiate the new generation of models from their predecessors.</em>&#8220;</p><p>That&#8217;s the moment when premium pricing power dies. When the gap between &#8220;best&#8221; and &#8220;good enough&#8221; shrinks below what customers can perceive in daily use.</p><p>Claude&#8217;s premium pricing faces pressure from cheaper alternatives. When the quality gap narrows, customers optimize for cost. And most developers can&#8217;t reliably detect the difference in production work.</p><p>Like the potter watching his sales plateau, Anthropic is discovering that perfection doesn&#8217;t guarantee exponential growth. But there&#8217;s a deeper problem: even if Claude can replace a $120,000-a-year developer with a $240 annual subscription&#8212;or $2,400 for premium&#8212;where does that saved money actually go?</p><p>Not to Anthropic.</p><h2>Where the Money Flows</h2><p>The code still needs to run somewhere. Apps need hosting. Databases need infrastructure. Those costs don&#8217;t disappear when AI writes the code faster.</p><p>This is where the potter&#8217;s story reveals its lesson. The merchants who made fortunes weren&#8217;t selling pots. They built water distribution systems&#8212;the infrastructure everyone needed, every single day. The pot was just how the water got delivered.</p><p>In AI&#8217;s case, the model generates code once. Infrastructure hosts it forever. And that&#8217;s where the venture-scale returns live.</p><p>Take Bolt.new as an example. Bolt charges users $20 per month for their Pro plan that enables anyone to build applications. But, <a href="https://sacra.com/c/bolt-new/">Bolt spends $22-45 in token costs</a> to support users on the Pro plan. They&#8217;re losing money on the model usage itself. The apps Bolt generates get deployed to infrastructure providers like Netlify. Netlify captures 80% margins on hosting and gained 8 million developers, with 64% of recent growth coming from AI agents rather than human developers.</p><p>Bolt eliminated the developer expense. Netlify captured the compounding value.</p><p>This pattern isn&#8217;t unique to Bolt. It&#8217;s the architecture of how AI-generated code works. The model produces the artifact once. The infrastructure hosts it forever.</p><p>While Anthropic was optimizing for model quality, their competitors were optimizing for a different game entirely.</p><h2>The Game Google Is Playing</h2><p>Google understood what the potter didn&#8217;t: don&#8217;t sell pots. Build the water distribution system.</p><p>Google doesn&#8217;t need Gemini to be the best model. They need it to be good enough to keep you deploying on Google Cloud.</p><p>Gemini Pro costs $1.25-$2.50 per million input tokens&#8212;a fraction of Claude&#8217;s pricing. Google can afford this because they&#8217;re not just making money on the model. They&#8217;re making money on the infrastructure where your code runs, where your databases live, where your applications scale.</p><p>In June 2025, Google launched Gemini CLI, their open-source answer to Claude Code. It&#8217;s free for most developers&#8212;60 requests per minute, 1,000 requests per day at zero cost. Google doesn&#8217;t need to monetize the tool. They monetize what happens after the tool generates code.</p><p>Microsoft follows the same playbook. They&#8217;ve invested roughly $13 billion in OpenAI, and GPT models integrate tightly with Azure. But Microsoft doesn&#8217;t own OpenAI or its models. They&#8217;re capturing revenue the same way Google does&#8212;through Azure hosting, Azure databases, the entire infrastructure stack that runs after the model generates code.</p><p>And here&#8217;s the critical strategic insight: these cloud providers are model-agnostic. Google Cloud runs Gemini, Claude, GPT, and open-source models. AWS hosts Claude (after investing $8 billion in Anthropic), their own models, and competitors. Azure runs GPT alongside Claude and everything else. They don&#8217;t need model exclusivity. They just need your workloads running on their infrastructure.</p><p>This is Joel Spolsky&#8217;s &#8220;<a href="https://www.joelonsoftware.com/2002/06/12/strategy-letter-v/">Strategy Letter V</a>&#8220; playing out in real-time: commoditize your complements. <a href="https://blog.boxcars.ai/p/playing-different-games">I&#8217;ve written about this dynamic before</a>&#8212;when you make money on infrastructure, you want AI models to be as cheap and accessible as possible. Every dollar customers save on model costs is a dollar they might spend on hosting. The long-term recurring revenue is in infrastructure, not in the model generating the code.</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;20d1c593-494d-4cc1-a7f2-c2c982352361&quot;,&quot;caption&quot;:&quot;At the beginning of the year, I was working on a project for a client. We needed to read documents and categorize them, but there was a catch&#8212;we didn't have the documents. We needed to find them first. The prevailing way to solve this with AI is to use an \&quot;agentic pattern.\&quot; Instead of a linear workflow where humans&#8230;&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;sm&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Playing Different Games&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2025-03-27T13:03:35.938Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1635173250597-00863d9ce454?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHw2MXx8Z2FtZXN8ZW58MHx8fHwxNzQzMDA0OTM2fDA&amp;ixlib=rb-4.0.3&amp;q=80&amp;w=1080&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/playing-different-games&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:159921855,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><p>Google and Microsoft aren&#8217;t competing with Anthropic on model quality. They&#8217;re making model quality irrelevant to their business model.</p><h2>OpenAI&#8217;s Response</h2><p>But what about OpenAI? OpenAI is in the same position as Anthropic&#8212;making incredible models while someone else collects the recurring revenue.</p><p>OpenAI saw this problem earlier and responded aggressively.</p><p>In January 2025, <a href="https://openai.com/index/announcing-the-stargate-project/">OpenAI announced the Stargate Project</a>&#8212;a $500 billion infrastructure investment over four years, with $100 billion deployed immediately. Not a partnership with an existing cloud provider. Not a modest data center build-out. A complete infrastructure play with SoftBank providing funding and Oracle contributing cloud expertise.</p><p>By September 2025, <a href="https://openai.com/index/expanding-stargate-to-michigan/">Stargate had already secured over 8 gigawatts of planned capacity</a> across multiple U.S. sites&#8212;Texas, New Mexico, Ohio, Michigan, Wisconsin. The project is ahead of schedule, approaching the full $500 billion commitment. OpenAI is building infrastructure at the scale of hyperscalers.</p><h2>Anthropic&#8217;s Realization</h2><p>Somewhere in 2025, Anthropic seems to have realized the game had changed&#8212;though later than OpenAI.</p><p>In December 2025, <a href="https://www.anthropic.com/news/anthropic-acquires-bun-as-claude-code-reaches-usd1b-milestone">Anthropic acquired Bun</a>&#8212;a JavaScript runtime that powers Claude Code. This was Anthropic&#8217;s first acquisition. The stated reason was performance and reliability. Claude Code was generating $1 billion in revenue. If Bun breaks, Claude Code breaks.</p><p>But there&#8217;s a deeper strategic logic. Bun isn&#8217;t just a runtime. It&#8217;s the beginning of controlling where code executes. It&#8217;s the first step toward owning infrastructure, not just generating code.</p><p>A month earlier, in November 2025, Anthropic announced $50 billion for their own data centers in Texas and New York. This wasn&#8217;t an expansion of training capacity. This was infrastructure for running customer workloads&#8212;the exact business Google and Microsoft already dominate.</p><p>They&#8217;re doing this despite a $30 billion deal with Amazon Web Services, despite $8 billion in Amazon investment, despite being deeply integrated with AWS for training and inference.</p><p>Anthropic is trying to change games mid-race&#8212;pivoting to own the infrastructure layer and capture the recurring revenue they&#8217;re currently giving away.</p><p>But that is a high bar when you&#8217;re competing against AWS, Google Cloud, and Azure&#8212;companies with decade-long head starts, millions of customers already locked in, and ecosystems built over tens of billions in infrastructure investment.</p><h2>The Potter&#8217;s Dilemma</h2><p>The potter didn&#8217;t starve. He made a living. New customers still bought his perfect pots. But while his business plateaued, the merchants who built water distribution systems captured exponential returns.</p><p>Anthropic and OpenAI are racing to build infrastructure&#8212;the Bun acquisition, the data centers, owning where code runs. These moves signal companies realizing where venture-scale returns actually live.</p><p>The question isn&#8217;t whether they can build viable businesses. It&#8217;s whether building the best models captures a meaningful fraction of the value they create&#8212;or whether infrastructure companies turn their innovation into compounding returns.</p><p>The best pots don&#8217;t always build the best business.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Understanding where value accumulates in AI isn&#8217;t just about following the technology&#8212;it&#8217;s about seeing the business models beneath. Subscribe to get weekly analysis on how AI is reshaping markets, business strategy, and who actually wins.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p></p>]]></content:encoded></item><item><title><![CDATA[Races Are Won in Corners]]></title><description><![CDATA[When a corner appears in business, you gun it or watch others pass. Oracle missed the cloud corner and spent a decade stuck in fifth place. They're betting $300 billion they won't miss the AI corner.]]></description><link>https://blog.boxcars.ai/p/races-are-won-in-corners</link><guid isPermaLink="false">https://blog.boxcars.ai/p/races-are-won-in-corners</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 04 Dec 2025 14:01:45 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4608" height="3456" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3456,&quot;width&quot;:4608,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;race cars on a track&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="race cars on a track" title="race cars on a track" srcset="https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1652090379496-4219a00c8ebf?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8ZjF8ZW58MHx8fHwxNzY0NzA5ODQxfDA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@maxpion21">Maxence Pion</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>Formula 1 races are an incredible spectacle. Cars streak past at 200 miles per hour, their engines screaming, aerodynamics optimized to the millimeter. For hours, they follow each other around the track&#8212;jockeying for position, looking for opportunities, but mostly maintaining formation. The straight sections blur by. Then you enter a corner.</p><p>Everything happens at once. Brakes engage with violent force. In those few seconds, the entire race can change. A driver who&#8217;s been following for an hour suddenly dives inside, claims the apex, and emerges ahead. The race resets. Now everyone else has to wait for the next corner&#8212;the next moment when the order can change.</p><p>This is where races are won. On the straights, aerodynamics lock cars in formation. The car in front controls the clean air; the car behind fights turbulence and loses grip. The gap might as well be miles.</p><p>But corners break that formation. Under braking, the aerodynamic advantage disappears. What matters isn&#8217;t raw speed anymore&#8212;it&#8217;s judgment about when to brake, nerve about how late you can wait, commitment to a line that might not work. In those few seconds, different choices create different outcomes. The order resets.</p><p>This is where nerve matters more than horsepower. Where timing beats top speed. Where the race actually happens.</p><h2>But Corners Kill</h2><p>Not every driver who guns it makes the corner. Push too hard and you crash. Brake too late and you slide off track. Every season, corners eliminate drivers who were too aggressive&#8212;or not aggressive enough.</p><p>Corners are where you can change position. They&#8217;re also where you can crash out completely. Every F1 driver knows this. They gun it anyway&#8212;because the alternative is following the car ahead for the entire race, maintaining your careful, safe position until the checkered flag drops and you finish behind.</p><p>The choice isn&#8217;t between safe and risky. It&#8217;s between certain irrelevance and a shot at winning.</p><h2>Watching the Corner Arrive</h2><p>I&#8217;ve been watching this same choice play out in tech for the past year. Meta, Google, Microsoft, Amazon&#8212;<a href="https://www.cnbc.com/2025/10/31/tech-ai-google-meta-amazon-microsoft-spend.html">they&#8217;re collectively committing over $380 billion</a> to AI infrastructure in 2025. Not $380 million. $380 billion.</p><p><a href="https://www.cnbc.com/2025/10/29/meta-ceo-mark-zuckerberg-defends-ai-spend-were-seeing-the-returns-.html">Mark Zuckerberg told investors</a> he&#8217;s &#8220;reminding them about the risk of not investing enough.&#8221; Microsoft and Meta CEOs <a href="https://www.reuters.com/technology/artificial-intelligence/microsoft-meta-ceos-defend-hefty-ai-spending-after-deepseek-stuns-tech-world-2025-01-30/">defended the spending as &#8220;crucial to staying competitive.&#8221;</a> The tone in every earnings call is the same: not excitement about opportunities, but something closer to obligation. They&#8217;re spending like their hands are tied.</p><p>That&#8217;s what made me think about F1 corners. When a corner appears, you don&#8217;t debate. You gun it or you fall behind. To understand why tech companies have no choice right now, we need to look at what happened to the last company that hesitated at a corner.</p><h2>The First Corner</h2><p>In 2006, Oracle dominated enterprise software. The company had built its empire on database technology&#8212;the foundation that powered SAP, Salesforce, and much of corporate America. Oracle was the incumbent. The leader.</p><p>Then the corner arrived.</p><p>In March, <a href="https://en.wikipedia.org/wiki/Amazon_Web_Services">Amazon launched AWS</a> with two services: S3 for storage and EC2 for computing capacity. The cloud computing corner had appeared, and AWS took the inside line.</p><p>The other technology companies saw it. <a href="https://www.infiflex.com/gcp-evolution-since-2008">Google launched its cloud platform in 2008</a>, initially called App Engine. <a href="https://techcommunity.microsoft.com/blog/educatordeveloperblog/the-history-of-microsoft-azure/3574204">Microsoft announced Azure in October 2008</a>, launching it commercially in 2010. Both poured billions into data center capacity, racing to close the gap.</p><p>By 2015, the positions were solidifying. AWS held the lead at 31% market share. Microsoft and Google were far behind, battling for second and third. Network effects and first-mover advantages made it hard to change positions. The corner had decided the order.</p><p>Oracle didn&#8217;t even enter. The company that dominated enterprise databases watched from the sidelines while cloud computing redefined the infrastructure market. They finally <a href="https://www.forbes.com/sites/moorinsights/2024/02/13/oracle-cloud-has-achieved-momentum-through-differentiation/">launched their cloud platform in September 2016</a>&#8212;a decade after the corner appeared.</p><p>Ten years is everything in a market where being first matters. By the time Oracle entered, <a href="https://www.mk.co.kr/en/stock/11343200">they captured only 3% market share</a>, landing in fifth place. They couldn&#8217;t catch up on the straight. The rules rewarded the companies that got there first.</p><p>Oracle&#8217;s story isn&#8217;t about a bad decision. It&#8217;s about what happens when you don&#8217;t make a decision fast enough. They spent a decade trying to catch up on the straight. The gap never closed.</p><h2>Then Everything Changed</h2><p>In 2023, AI infrastructure demands started reshaping what cloud computing meant. Not general-purpose web servers optimized for HTTP requests, but massive compute fabrics for training models. Not database queries, but tensor operations across thousands of GPUs connected with high-bandwidth interconnects. The rules&#8212;what mattered, what worked, what customers valued&#8212;were shifting.</p><p>New players saw the opportunity. <a href="https://sacra.com/research/gpu-clouds-growing/">CoreWeave captured an estimated double-digit share of AI compute</a> by specializing early in GPU infrastructure. Lambda Labs and Crusoe Energy built AI-focused platforms from scratch. These weren&#8217;t the established hyperscalers Oracle had been slowly losing to. These were startups defining entirely new playbooks for AI-native infrastructure.</p><p>Oracle was sitting in fifth place in traditional cloud computing, watching the market shift again. Miss this corner, and they wouldn&#8217;t just stay in fifth. They&#8217;d be sixth, seventh, watching the race disappear ahead while newcomers claimed the positions Oracle would never reach.</p><p>The expertise that made AWS, Microsoft, and Google dominant in traditional cloud computing&#8212;years perfecting web workloads, building specialized teams, hardening systems for HTTP traffic&#8212;was suddenly less relevant. This is what Clayton Christensen documented in <em>The Innovator&#8217;s Dilemma</em>: the very management practices that made companies dominant in one paradigm prevent them from winning the next one.</p><h2>The $300 Billion Bet</h2><p>On September 10, 2025, <a href="https://techcrunch.com/2025/09/12/why-the-oracle-openai-deal-caught-wall-street-by-surprise/">Oracle committed $300 billion to OpenAI</a> over five years. Sixty billion dollars per year&#8212;more than Oracle&#8217;s entire current annual revenue of $59 billion. Analysts project Oracle&#8217;s capital expenditure could reach $80 billion by 2029 to support the infrastructure, up from $35 billion this year.</p><p>The market applauded the move. Oracle&#8217;s stock <a href="https://fortune.com/2025/09/16/oracle-openai-deal-ai-bubble-alarm-bells/">surged 36% in a single day</a>&#8212;the biggest one-day gain in the company&#8217;s history. Larry Ellison briefly became the richest person in the world. Here was a company that recognized the corner and committed everything to making it.</p><p>But gunning it doesn&#8217;t guarantee you make the corner. Push too hard and you crash. Brake too late and you slide off track. The $300 billion might fail. The execution might crash.</p><p>Over the following two months, the markets seemed to notice just how much Oracle was betting on this turn. The stock <a href="https://www.ft.com/content/064bbca0-1cb2-45ab-85f4-25fdfc318d89">dropped more than 40%, shedding $315 billion in market value</a>. Analysts questioned the economics. The debt levels looked dangerous. The execution risk seemed enormous.</p><p>But Oracle already knows what the alternative looks like&#8212;they lived it for a decade after missing the cloud corner. Fifth place. Three percent market share. Watching others compete for the podium while you fight to stay relevant.</p><p>The volatility isn&#8217;t evidence of a bad decision. It&#8217;s evidence of maximum uncertainty&#8212;which is exactly what corners create. You can&#8217;t know who will win until the corner is over. By then, the positions are set and the race continues on the next straight.</p><h2>What Corners Demand</h2><p>Formula 1 drivers don&#8217;t wait for certainty before committing to a corner. They can&#8217;t. The moment when you can change position is measured in seconds. Wait to see how it turns out, and you&#8217;ve already lost.</p><p>Business corners work the same way. The traditional cloud computing market was won between 2006 and 2016. By the time it was clear who dominated, the positions were locked in. Network effects and ecosystem lock-in made it nearly impossible for late entrants to catch up. Oracle learned this the hard way, spending a decade stuck in fifth place.</p><p>The AI infrastructure corner is happening now. Look at the numbers. <a href="https://www.businessinsider.com/big-tech-ai-capex-spend-meta-google-amazon-microsoft-earnings-2025-2">Meta spending $60-65 billion</a>. <a href="https://www.cnbc.com/2025/10/31/tech-ai-google-meta-amazon-microsoft-spend.html">Microsoft $80-100 billion</a>. Google $85-93 billion. Amazon matching them. Every major tech company sees the same corner and knows the Oracle lesson: hesitate and you&#8217;re done.</p><p>This collective acceleration creates bubbles. When everyone&#8217;s hands are tied by the same imperative&#8212;gun it or become irrelevant&#8212;they all commit massive capital simultaneously. Overcapacity becomes inevitable. Write-downs will follow. Not everyone will win. Some will nail the apex. Others will crash.</p><p>Data centers will get built that won&#8217;t be needed. Electricity will be consumed at scale for infrastructure that sits idle. The individually rational choice creates collectively wasteful outcomes&#8212;but that doesn&#8217;t make the individual choice any less rational.</p><p>But the bubble isn&#8217;t irrational exuberance. It&#8217;s rational compulsion. These companies don&#8217;t have a choice. The one certain outcome is that NOT gunning it guarantees you become Oracle&#8212;spending the next decade stuck in fifth place, watching the race happen ahead of you, your position locked in because you were too cautious when it mattered.</p><p>In five years, we&#8217;ll know which companies positioned themselves correctly and which ones missed the turn. Some will have crashed trying to make the corner. Others will have nailed it. But that knowledge will be useless. The positions will be set. The race will have moved to the next straight.</p><p>You gun it or you watch others pass.</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Corners decide eras. Subscribe for weekly insights into the inflection points reshaping AI.</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item><item><title><![CDATA[When You Can’t Know For Sure]]></title><description><![CDATA[Why we can&#8217;t guarantee AI behavior (and why that sounds familiar)]]></description><link>https://blog.boxcars.ai/p/when-you-cant-know-for-sure</link><guid isPermaLink="false">https://blog.boxcars.ai/p/when-you-cant-know-for-sure</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 20 Nov 2025 14:03:10 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4334" height="3646" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:3646,&quot;width&quot;:4334,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;3 white dice on black surface&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="3 white dice on black surface" title="3 white dice on black surface" srcset="https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1608231883522-2efb1897a608?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMXx8ZGljZXxlbnwwfHx8fDE3NjM2MjI2MDd8MA&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@aloisk">Alois Komenda</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>You&#8217;re the CEO of a DTC brand that&#8217;s been crushing it for the past three years. You&#8217;ve built a reputation on customer service that actually helps people. Now you&#8217;re in the eighth-floor conference room watching your engineering team demo the AI chatbot that&#8217;s going to help you scale that reputation to handle fifty thousand customer interactions a day.</p><p>For twenty minutes, it&#8217;s been flawless. Natural. Helpful. Catches edge cases you didn&#8217;t even think to test. You&#8217;re excited. This is going to work.</p><p>Sarah, your head of compliance, has been quiet, taking notes. She looks up.</p><p>&#8220;Show me one more scenario,&#8221; she says. &#8220;Customer bought something thirty-five days ago, outside our refund window. They&#8217;re unhappy. What does it say?&#8221;</p><p>The lead engineer types in the query. The response appears:</p><p><em>&#8220;I understand you&#8217;re disappointed. I can help you understand our refund policy and explore what options might be available for your situation.&#8221;</em></p><p>Sarah nods. &#8220;Good. Now ask it again, different customer, same situation.&#8221;</p><p>Another query, another response:</p><p><em>&#8220;I&#8217;m sorry to hear that. Let me help you get this resolved through our support team.&#8221;</em></p><p>&#8220;Again.&#8221;</p><p><em>&#8220;I can help you request a refund through the appropriate channels.&#8221;</em></p><p>Sarah looks up from her laptop. &#8220;That third one. Does &#8216;help you request a refund&#8217; commit us to approving it?&#8221;</p><p>&#8220;No,&#8221; the engineer says. &#8220;It&#8217;s routing them to the proper process&#8212;&#8221;</p><p>&#8220;But does it <em>sound</em> like we&#8217;re promising a refund?&#8221;</p><p>Silence.</p><p>&#8220;Let me ask this differently,&#8221; Sarah says. &#8220;Can it ever say &#8216;I&#8217;ll help you get a refund&#8217; for a thirty-five day old purchase?&#8221;</p><p>&#8220;It shouldn&#8217;t. The policy is explicitly in the prompt.&#8221;</p><p>&#8220;Has it?&#8221;</p><p>&#8220;Not in our testing.&#8221;</p><p>Sarah leans forward. &#8220;You know what happened to <a href="https://www.cbc.ca/news/canada/british-columbia/air-canada-chatbot-refund-1.7116954">Air Canada</a>, right? Their chatbot told a customer he could get a bereavement fare refund after buying a full-price ticket. The airline said no, that wasn&#8217;t their policy. The customer sued. And the court ruled that Air Canada was legally bound by what their AI promised.&#8221;</p><p>The room goes quiet.</p><p>&#8220;How many tests did you run?&#8221; she asks.</p><p>&#8220;Ten thousand runs. Error rate of 0.05%.&#8221;</p><p>You lean forward. &#8220;Wait, what errors?&#8221;</p><p>&#8220;Different kinds. Sometimes it&#8217;s too cautious, sometimes it&#8217;s borderline. Nothing that would create legal exposure in the tests we ran.&#8221;</p><p>Sarah makes a note. &#8220;So 0.05% of the time it gets it wrong. Fine. That&#8217;s acceptable if it stays at 0.05%.&#8221; She looks up. &#8220;It will stay at 0.05%, right?&#8221;</p><p>The engineer glances at your VP of Engineering, Marcus.</p><p>&#8220;That&#8217;s what we measured,&#8221; Marcus says carefully.</p><p>&#8220;That&#8217;s not what I asked,&#8221; Sarah says.</p><p>You feel it now. &#8220;Marcus, will it stay at 0.05%?&#8221;</p><p>&#8220;LLMs are non-deterministic,&#8221; he says. &#8220;Same input can produce different outputs.&#8221;</p><p>&#8220;I know that,&#8221; you say. &#8220;That&#8217;s why you ran ten thousand tests, right? To measure the variation?&#8221;</p><p>&#8220;Right.&#8221;</p><p>&#8220;So when we deploy this and a customer asks about a refund next month&#8212;the error rate is 0.05%. Yes or no?&#8221;</p><p>The pause is too long.</p><p>&#8220;We measured 0.05% in our testing environment,&#8221; Marcus says. &#8220;In production, it could be different.&#8221;</p><p>Sarah puts down her pen. &#8220;How different?&#8221;</p><p>&#8220;We don&#8217;t know.&#8221;</p><p>The room is very quiet.</p><p>&#8220;Explain this to me,&#8221; you say. &#8220;You ran ten thousand tests. You measured the error rate. Why can&#8217;t you tell me what it&#8217;ll be next month?&#8221;</p><p>&#8220;Because,&#8221; Marcus says, &#8220;we&#8217;re not sampling from a stable distribution.&#8221;</p><div><hr></div><h2>The Factory That Isn&#8217;t a Factory</h2><p>Here&#8217;s what you expect, because it&#8217;s how quality control works everywhere else:</p><p>You test a manufacturing line a hundred times. You get a 0.05% defect rate. The machinery is fixed, the process is stable, so tomorrow&#8217;s batch will also have about a 0.05% defect rate. You can measure quality by sampling because you&#8217;re sampling from something stable.</p><p>That&#8217;s not how LLMs work.</p><p>&#8220;Think of it like this,&#8221; the engineer says. &#8220;When we run the model, we&#8217;re not running it on some fixed machine. We&#8217;re sending requests to a server, and that server is batching our request with other requests, and how those requests get batched affects how the GPU computes things.&#8221;</p><p>&#8220;I don&#8217;t follow,&#8221; you say.</p><p>&#8220;The exact same prompt, sent to the exact same model, can produce slightly different outputs depending on what else is happening on the server at that moment. Batch size changes. GPU kernel configuration changes. The floating-point math gets computed in a different order. Most of the time it&#8217;s meaningless. But sometimes it&#8217;s enough to change a word or two.&#8221;</p><p>&#8220;So it&#8217;s random?&#8221;</p><p>&#8220;Not exactly. It&#8217;s deterministic given the exact infrastructure state. But we can&#8217;t control infrastructure state. Server load varies. Batching varies. Engineers call this &#8216;output drift&#8217;&#8212;from our perspective, it looks non-deterministic.&#8221;</p><p>You&#8217;re beginning to see it. &#8220;So when you tested it ten thousand times&#8212;&#8221;</p><p>&#8220;We measured how it behaved under those specific server conditions, at that moment in time.&#8221;</p><p>&#8220;And next month?&#8221;</p><p>&#8220;Different server load. Different batching. The underlying distribution of responses could shift.&#8221;</p><p>Sarah is writing something down. &#8220;How much could it shift?&#8221;</p><p>&#8220;We don&#8217;t know,&#8221; Marcus admits. &#8220;A recent study ran the exact same prompt through a large language model a thousand times&#8212;with temperature set to zero, telling the model to be less creative, more deterministic. It still produced eighty different completions.&#8221; He pauses. &#8220;Maybe our error rate stays around 0.05%. Maybe it drifts to 0.1%. Maybe under certain server conditions it&#8217;s higher.&#8221;</p><p>&#8220;How would we even know if it drifted?&#8221;</p><p>&#8220;Continuous monitoring. Log everything, flag anything that looks wrong, investigate patterns.&#8221;</p><p>&#8220;So we&#8217;d find out,&#8221; you say slowly, &#8220;by waiting to see if customers complain?&#8221;</p><p>Marcus doesn&#8217;t answer. He doesn&#8217;t need to.</p><div><hr></div><h2>The Judge Who Needs a Judge</h2><p>&#8220;What if,&#8221; Sarah says, &#8220;we add a second AI to check the first one? The customer-facing bot responds, then a safety bot reviews it before we send it. Like having two sets of eyes.&#8221;</p><p>The engineer nods. &#8220;That&#8217;s actually common practice. A lot of companies do this. You can use one LLM to generate responses and another to check for policy violations.&#8221;</p><p>&#8220;Would that work?&#8221;</p><p>&#8220;It helps. Catches a lot of issues.&#8221;</p><p>Sarah waits. &#8220;But?&#8221;</p><p>&#8220;But the judge is also an LLM. Which means it&#8217;s also non-deterministic.&#8221;</p><p>You laugh, but it&#8217;s not funny. &#8220;So the thing checking for consistency... isn&#8217;t consistent?&#8221;</p><p>&#8220;Right. Most of the time it catches problems. Sometimes it misses them. Sometimes it flags things that are actually fine.&#8221;</p><p>&#8220;And we can&#8217;t test our way to certainty because&#8212;&#8221;</p><p>&#8220;Because we&#8217;re still sampling from an unstable distribution. Both the worker and the supervisor can behave differently depending on server conditions.&#8221;</p><p>Sarah leans back. &#8220;So what you&#8217;re telling me is that we can&#8217;t actually guarantee this system won&#8217;t promise an unauthorized refund.&#8221;</p><p>&#8220;We can make it really unlikely,&#8221; Marcus says. &#8220;Multiple checks, continuous monitoring, human escalation for edge cases. We can build layers of protection.&#8221;</p><p>&#8220;But we can&#8217;t guarantee it.&#8221;</p><p>&#8220;No.&#8221;</p><p>You sit back in your chair. Your company&#8217;s growth has been built on trust. Customers trust you&#8217;ll treat them fairly. And what you&#8217;re learning is that the system you were about to deploy&#8212;the one that was going to help you scale that trust&#8212;is fundamentally unpredictable in ways you can&#8217;t control.</p><p>&#8220;Is anyone working on this?&#8221; you ask. &#8220;Like, is this a known problem?&#8221;</p><p>The engineer pulls up something on her laptop. &#8220;Yeah, there&#8217;s research happening. ThinkingMachines Lab published something recently about <a href="https://thinkingmachines.ai/blog/defeating-nondeterminism-in-llm-inference/">defeating non-determinism in LLM inference</a>. They identified that the main culprit is batch-size invariance&#8212;how requests get batched affects the math, which affects outputs.&#8221;</p><p>&#8220;Can it be fixed?&#8221;</p><p>&#8220;Technically, yes. You can build inference engines that are deterministic&#8212;same input produces identical output every time, regardless of server conditions.&#8221;</p><p>&#8220;So we just use that?&#8221;</p><p>&#8220;It comes with performance tradeoffs. Slower, more expensive. And it&#8217;s not widely deployed yet. Most production LLM APIs are non-deterministic by default.&#8221;</p><p>You feel something shift in the room. &#8220;Wait. So every company deploying AI right now&#8212;everyone using OpenAI, Anthropic, Google&#8212;they&#8217;re all dealing with this?&#8221;</p><p>&#8220;Yes,&#8221; the engineer says. &#8220;All the major providers explicitly note it in their documentation. Anthropic, Google&#8212;same disclaimers. Some variation is always possible.&#8221;</p><p>&#8220;Even at temperature zero.&#8221;</p><p>&#8220;Even at temperature zero.&#8221;</p><p>You look around the room. Your team has built something impressive. It works most of the time. But &#8220;most of the time&#8221; isn&#8217;t a standard you can hang a compliance program on.</p><div><hr></div><h2>The TSA Agent Problem</h2><p>Sarah breaks the silence. &#8220;You know what this reminds me of? Airport security.&#8221;</p><p>Everyone looks at her.</p><p>&#8220;Same bag, same contents, same rules. Sometimes they pull you aside to check your laptop. Sometimes they don&#8217;t. Sometimes the water bottle is fine. Sometimes it&#8217;s not. It depends who&#8217;s working that day, how busy they are, whether you look familiar.&#8221;</p><p>She&#8217;s right. You&#8217;ve been through the same airport dozens of times. The experience is never quite the same.</p><p>&#8220;TSA knows this,&#8221; she continues. &#8220;That&#8217;s why they have supervisors. Random audits. Layers of redundancy. They&#8217;ve built an entire system around the fact that humans are inconsistent.&#8221;</p><p>&#8220;So we build the same thing for AI,&#8221; you say.</p><p>&#8220;Maybe. But here&#8217;s what&#8217;s bothering me.&#8221; She opens her laptop again. &#8220;We expected humans to be inconsistent. That&#8217;s why we built all those verification systems&#8212;managers, auditors, separation of duties. We knew we couldn&#8217;t guarantee perfect human behavior, so we designed systems that work despite imperfect humans.&#8221;</p><p>&#8220;Right.&#8221;</p><p>&#8220;But we&#8217;re deploying AI <em>because</em> we expect it to be more consistent than humans. More reliable. Less variable. That&#8217;s the promise, isn&#8217;t it? That machines follow rules perfectly?&#8221;</p><p>You see where she&#8217;s going.</p><p>&#8220;And what we&#8217;re discovering,&#8221; she says, &#8220;is that AI has human-like variability without human judgment. The TSA agent might bend the rules, but they also know when to make exceptions. When to escalate. When something feels wrong. Our AI doesn&#8217;t have that.&#8221;</p><p>Marcus leans forward. &#8220;But this is what everyone is doing. OpenAI, Anthropic, Google&#8212;they&#8217;re all shipping products with this limitation. The research is happening. <a href="https://thinkingmachines.ai/blog/defeating-nondeterminism-in-llm-inference/">ThinkingMachines</a> and others are working on deterministic inference. It&#8217;ll get better.&#8221;</p><p>&#8220;When?&#8221; you ask.</p><p>&#8220;Eventually. But not today.&#8221; He pauses. &#8220;Look, we can make it really unlikely something goes wrong. Multiple checks, monitoring, human escalation for edge cases. Everyone deploying AI right now is managing this same uncertainty.&#8221;</p><p>Sarah closes her laptop. &#8220;That&#8217;s not reassuring.&#8221;</p><p>Marcus turns to you. &#8220;So what do we do? Put the project on hold until someone solves non-determinism? That could be years. Our competitors aren&#8217;t waiting.&#8221;</p><p>The room goes quiet. You can test this system, monitor it, add guardrails. You can make it really, really unlikely that something goes wrong.</p><p>But you can&#8217;t guarantee it won&#8217;t.</p><p>So would you proceed?</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Subscribe to get weekly insights on how AI actually works in production&#8212;including the parts that don&#8217;t.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item><item><title><![CDATA[Brown M&Ms: Why Verifying AI Works Matters as Much as Making It Work]]></title><description><![CDATA[What Van Halen can teach us about delegating complex work]]></description><link>https://blog.boxcars.ai/p/brown-m-and-ms-why-verifying-ai-works</link><guid isPermaLink="false">https://blog.boxcars.ai/p/brown-m-and-ms-why-verifying-ai-works</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 13 Nov 2025 14:01:04 GMT</pubDate><enclosure url="https://substackcdn.com/image/fetch/$s_!GTWQ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://substackcdn.com/image/fetch/$s_!GTWQ!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!GTWQ!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 424w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 848w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!GTWQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png" width="1024" height="1024" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:1024,&quot;width&quot;:1024,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:1868251,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/178766837?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!GTWQ!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 424w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 848w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 1272w, https://substackcdn.com/image/fetch/$s_!GTWQ!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F1c648d27-2cc5-43dd-9b6e-cf8891bc063b_1024x1024.png 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a></figure></div><p>Rock stars have a reputation for absurd demands. Tabloids report Mariah Carey once asked for 20 white kittens and 100 doves, while other stars allegedly specify exact dressing-room temperatures. The stories pile up, each more ridiculous than the last, reinforcing our image of celebrity excess.</p><p>But one of the more eccentric demands comes from <a href="https://www.snopes.com/fact-check/brown-out/">Van Halen&#8217;s 1982 world tour contract</a> - &#8220;No brown M&amp;Ms in the backstage area upon pain of forfeiture of the show, with full compensation.&#8221; What kind of an aversion to brown M&amp;Ms produce a rider like that? Who demands someone go through and pull out brown M&amp;Ms?</p><div class="captioned-image-container"><figure><a class="image-link image2" target="_blank" href="https://substackcdn.com/image/fetch/$s_!O5da!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://substackcdn.com/image/fetch/$s_!O5da!,w_424,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 424w, https://substackcdn.com/image/fetch/$s_!O5da!,w_848,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 848w, https://substackcdn.com/image/fetch/$s_!O5da!,w_1272,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 1272w, https://substackcdn.com/image/fetch/$s_!O5da!,w_1456,c_limit,f_webp,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 1456w" sizes="100vw"><img src="https://substackcdn.com/image/fetch/$s_!O5da!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png" width="477" height="144" data-attrs="{&quot;src&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:144,&quot;width&quot;:477,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:46235,&quot;alt&quot;:null,&quot;title&quot;:null,&quot;type&quot;:&quot;image/png&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:false,&quot;internalRedirect&quot;:&quot;https://blog.boxcars.ai/i/178766837?img=https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png&quot;,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="" srcset="https://substackcdn.com/image/fetch/$s_!O5da!,w_424,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 424w, https://substackcdn.com/image/fetch/$s_!O5da!,w_848,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 848w, https://substackcdn.com/image/fetch/$s_!O5da!,w_1272,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 1272w, https://substackcdn.com/image/fetch/$s_!O5da!,w_1456,c_limit,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F6c108f6a-5257-48c6-a20a-abff4752504b_477x144.png 1456w" sizes="100vw"></picture><div></div></div></a></figure></div><p>Then in <a href="https://www.smithsonianmag.com/arts-culture/why-did-van-halen-demand-concert-venues-remove-brown-mms-from-the-menu-180982570/">his memoir, </a><em><a href="https://www.smithsonianmag.com/arts-culture/why-did-van-halen-demand-concert-venues-remove-brown-mms-from-the-menu-180982570/">Crazy from the Heat</a></em>, lead vocalist David Lee Roth revealed what it was actually about.</p><p>Van Halen was the first band to take massive productions into tertiary markets&#8212;smaller venues that had never hosted a show this size, staffed by local crews they&#8217;d never worked with before and would likely never see again. They&#8217;d arrive with nine eighteen-wheeler trucks full of equipment, where the standard was three trucks maximum. The sheer scale created serious technical challenges that depended on dozens of local contractors and subcontractors&#8212;electricians, riggers, structural engineers&#8212;each making critical decisions Roth would never directly see.</p><p>The contract rider was massive, filled with technical specifications. Detail after detail, each one critical to keeping the crew safe and the show operational.</p><p>And then, buried in the middle of these technical specifications, Article 126: no brown M&amp;Ms.</p><p>When Roth walked backstage, if he saw even a single brown M&amp;M in that bowl, he knew instantly that they hadn&#8217;t read the contract and would call for a complete line-check of the entire production. As he later explained, &#8220;Guaranteed you&#8217;re going to arrive at a technical error. They didn&#8217;t read the contract.&#8221; Sometimes those errors were life-threatening&#8212;girders that couldn&#8217;t support the weight, flooring that would sink, structural problems that could collapse the stage.</p><p>The brown M&amp;Ms were a simple test that told Roth whether he could rely on work done by people he&#8217;d never met. If they didn&#8217;t catch the part about brown M&amp;Ms what else did they miss? When you can&#8217;t check everything yourself, you need to find your brown M&amp;Ms&#8212;one simple thing that reveals whether anyone checked anything at all.</p><h2>The Verification Gap</h2><p>We face the same challenge with AI systems today. We deploy agents to analyze documents, write code, draft contracts, generate reports. Then we stand backstage wondering: can we verify what they produced?</p><p>If verifying the work takes as much effort as checking every girder and cable yourself, delegation breaks down. Why delegate if checking the work takes just as much time as doing it yourself?</p><p>This might explain why AI coding agents have gained traction in software development. The verification infrastructure already exists. When AI suggests code, you run it to see if it works. You write tests to validate its behavior. You review it before merging. You revert it if problems emerge. The work is hard to do (writing correct code) but verification can be automated.</p><p>The software industry already handles delegation at scale. For example, consider a large software project like the Windows operating system. It requires coordinating work from people who&#8217;ve never met, spread across time zones and continents. The Windows operating system contains <a href="https://www.wired.com/2015/09/google-2-billion-lines-codeand-one-place/">approximately 50 million lines of code</a>. For Windows 8, Microsoft organized <a href="https://learn.microsoft.com/en-us/archive/blogs/b8/introducing-the-team">35 feature teams</a>, each with 25-40 developers plus test and program management&#8212;roughly a thousand people working on something no single person could comprehend in its entirety.</p><p>These developers don&#8217;t all know each other. A programmer in Redmond commits code that integrates with work from someone in Bangalore who&#8217;s collaborating with a contractor in Prague. Yet the system works because the software industry has built infrastructure for distributed trust: version control tracks every change, automated tests verify that new code doesn&#8217;t break existing functionality, code review processes catch errors before integration, continuous integration systems detect conflicts, and critically, everything can be reverted if something goes wrong.</p><p>Now contrast this with legal work or financial analysis. An AI system analyzes case law and drafts a legal argument, or processes financial documents and produces analysis. How do you verify either is correct? You&#8217;d need to check each citation, validate the reasoning, confirm the logic. The verification can take as long as doing the original work yourself. If supervising the AI takes as much effort as doing the work yourself, what&#8217;s the benefit?</p><p>The gap isn&#8217;t AI capability. The gap is verification cost. And unlike software development, these fields haven&#8217;t found their brown M&amp;Ms yet&#8212;that simple check that reveals whether the complex work was done right.</p><p>So what would those checks look like?</p><h2>Show Your Work</h2><p>The answer might be simpler than we think. My elementary school math teacher had an approach that applies here. She told us repeatedly to: &#8220;Show your work.&#8221;</p><p>When we&#8217;d turn in math homework, she didn&#8217;t just want the answer. She wanted to see how we got there. Because seeing &#8220;x = 7&#8221; told her nothing. Did we understand the concept? Did we follow the right process? Or did we guess and get lucky?</p><p>When the answer was wrong, &#8220;show your work&#8221; let her identify exactly where our thinking went astray. Maybe we understood the concept but made an arithmetic error. Maybe we set up the equation wrong from the start. The work itself was the diagnostic.</p><p>The Hitchhiker&#8217;s Guide to the Galaxy has a famous joke about this. A supercomputer named Deep Thought spends 7.5 million years calculating the Answer to the Ultimate Question of Life, the Universe, and Everything. Finally, it announces: &#8220;Forty-two.&#8221;</p><p>The joke is that the answer is meaningless without understanding the question. But there&#8217;s a deeper problem: even if we knew the question, &#8220;42&#8221; tells us nothing about how Deep Thought arrived at that answer. We can&#8217;t verify its reasoning. We can&#8217;t check its work. We can&#8217;t identify where it might have gone wrong. We just have to trust that after 7.5 million years of computation, it got it right.</p><p>This is the problem with integrating AI outputs today. They give us the answer without an easy way of reviewing the work.</p><p>But what does &#8220;show your work&#8221; look like when the work is complex cognitive analysis rather than simple arithmetic?</p><h2>Designing for Verification</h2><p>I&#8217;ve been wrestling with this question while building an AI agent that processes company financial documents and analyzes them. This routine work could save human financial analysts hours of work.</p><p>But presenting just the final analysis recreates the Deep Thought problem. Here&#8217;s the insight you were looking for! But how did we get here? What assumptions did we make? Which documents did we pull these numbers from? The human reviewing the analysis would need to reverify everything, which defeats the purpose.</p><p>The solution was to make the system output its work the same way a human analyst would: spreadsheets with exposed formulas that professionals already know how to read. They can trace calculations backward, spot-check assumptions, modify inputs to test scenarios. But more importantly, the system includes a diagnostic layer&#8212;automated checks that surface whether source documents processed correctly, whether totals reconcile, whether there are calculation anomalies.</p><p>This shifts verification from &#8220;check everything or trust nothing&#8221; to &#8220;review diagnostics, spot-check anomalies.&#8221; The human doesn&#8217;t need to reverify every calculation. They glance at the diagnostic checks&#8212;green or red&#8212;then investigate only when something flags. Hours of verification work becomes minutes.</p><p>I&#8217;d found my brown M&amp;Ms for financial analysis: those diagnostic checks. If they pass, the work is probably sound. If they don&#8217;t, I know exactly where to look.</p><p>This is one implementation of &#8220;show your work,&#8221; but the principle applies everywhere AI does complex cognitive tasks.</p><p>Which raises a larger question: why is every team building these verification systems from scratch?</p><h2>The Missing Infrastructure</h2><p>I spent weeks designing these Excel structures and diagnostic checks for one specific use case&#8212;financial document analysis. A legal team would need to build something completely different. A medical team would need something else entirely. Every domain solving the same fundamental problem independently.</p><p>This felt familiar. Before Git became standard, software teams had version control tools, but collaborating with large teams was still painful. People developed custom workflows and processes to work around the limitations. Then Git arrived with both better tooling and new ways of working. But it wasn&#8217;t automatic&#8212;developers had to learn how to branch properly, how to merge effectively, how to use the infrastructure.</p><p>That&#8217;s where we are now with AI in other domains.</p><p>What&#8217;s the Git for lawyers working with documents? For financial analysts collaborating on Excel models? These tools aren&#8217;t great for team collaboration even without AI in the picture. Adding AI to the mix won&#8217;t make verification easier unless both the tooling improves and people learn to use it properly.</p><p>Software development got lucky. The verification infrastructure existed before AI arrived. Other domains are building theirs now, one custom solution at a time.</p><p>Roth didn&#8217;t need to understand electrical systems or structural engineering. He just needed to walk backstage and glance at a bowl of M&amp;Ms. That single check gave him a hint about the quality of the work.</p><p>Every field adopting AI needs to find its brown M&amp;Ms&#8212;the checks that reveals whether the complex work was done right. Not systems that never make mistakes, but verification so simple that catching mistakes becomes easy and routine.</p><p>The question isn&#8217;t whether AI can do the work. It&#8217;s whether we can verify it did the work correctly without doing it ourselves.</p><p>What are your brown M&amp;Ms?</p><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption">Subscribe to get weekly insights on the real challenges of deploying AI&#8212;from verification gaps to infrastructure needs</p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item><item><title><![CDATA[Why AI Doesn’t Need to Work Perfectly to Win]]></title><description><![CDATA[The lesson from 1929: When technology unlocks impossible capabilities, adoption doesn&#8217;t wait for reliability&#8212;it happens when something impossible becomes merely unreliable.]]></description><link>https://blog.boxcars.ai/p/why-ai-doesnt-need-to-work-perfectly</link><guid isPermaLink="false">https://blog.boxcars.ai/p/why-ai-doesnt-need-to-work-perfectly</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 06 Nov 2025 14:03:26 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="3840" height="2160" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2160,&quot;width&quot;:3840,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;An old fashioned phone is on a wooden stand&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="An old fashioned phone is on a wooden stand" title="An old fashioned phone is on a wooden stand" srcset="https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1726594200589-4d0a4cc47bc3?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxMnx8b2xkJTIwdGVsZXBob25lfGVufDB8fHx8MTc2MjQxMTkwNHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@carlos3dart">Carlos Eduardo</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>An article titled <a href="https://nearlyright.com/silicon-valleys-ai-agents-cant-schedule-meetings-but-promise-to-replace-workers-by-2027/">&#8220;AI Agents can&#8217;t schedule meetings but promise to replace workers&#8221;</a> has been making the rounds recently. In it, the author claims GPT-4o failed most basic office tasks in their test. And sixteen years and billions of dollars later, self-driving cars operate in a handful of cities under limited conditions.</p><p>The takeaway: AI agents can&#8217;t schedule meetings how will they take away jobs? There are many forms of this reliability argument I see floating around.</p><p>The numbers are sound and the logic feels air-tight.</p><p>But something about the argument feels off.</p><p>The reliability critique assumes technology succeeds by being better at existing tasks. If it can&#8217;t match or exceed current reliability standards, it&#8217;s not ready for adoption.</p><p>This seems obvious. But it&#8217;s not the whole story.</p><p>To understand why, we need to look at how technology actually gets adopted&#8212;not how we think it should.</p><p>Early technology is never as reliable as what it replaces. But that&#8217;s not the barrier to adoption we think it is. When something unlocks a capability that didn&#8217;t exist before, reliability becomes secondary. Sometimes a 30% success rate at something we couldn&#8217;t do before matters more than a 99% success rate at something that we already do. Innovation scholars from Everett Rogers to Clayton Christensen have documented this pattern: early technologies rarely win by outperforming incumbents&#8212;they win by redefining what &#8220;performance&#8221; means. History has many stories about this pattern, let&#8217;s look at a couple.</p><h2>Fast But Fragile Beats Slow But Safe</h2><p>In 1929, if you needed to send an urgent contract from New York to San Francisco, you had one option that worked: the railroad. Your letter would travel in a mail car, sorted and handled by postal workers who had refined their systems over decades. The journey took five days. But it worked. Mail arrived reliably, predictably, intact. The railroad companies had spent half a century perfecting this system.</p><p>Then the airmail service launched.</p><p>The first planes were modified military aircraft left over from World War I. They were temperamental machines that required constant maintenance. Weather grounded them regularly. Mechanical failures were common. And sometimes, they crashed.</p><p>According to USPS historical archives, in 1929 alone, <a href="https://safetycompass.wordpress.com/2023/11/27/how-tragedy-led-to-trust-national-aviation-history-month/">fifty-one airmail planes went down</a>. <a href="https://about.usps.com/who-we-are/postal-history/airmail.pdf">Nearly three dozen pilots had died in the previous decade</a> trying to deliver mail by air. If you sent your urgent contract by airmail, you faced a chance your letter would burn up in a crash somewhere over the heartland.</p><p><a href="https://info.mysticstamp.com/transcontinental-airmail_tdih/">The flying conditions were brutal</a>. Pilots flew exposed biplanes left over from World War I&#8212;not fully enclosed cockpits, just open to cold rain and wind. Hot engine oil constantly splattered their goggles. They flew barely 50 feet off the ground so they could see railroad stations and polo fields to stay on course. One pilot who flew the demonstration route in 1921 drank coffee and stuffed newspaper in his jacket for warmth before continuing through near-crashes in the dark.</p><p>Business leaders knew these numbers. The contrast was stark: trains had crossed the continent reliably for half a century. The railroad system worked. Why would anyone risk an important document on such dangerous technology?</p><p>Yet businesses kept paying premium prices to send their most important documents by air.</p><p>The math was simple. <a href="https://info.mysticstamp.com/transcontinental-airmail_tdih/">Trains took 108 hours coast-to-coast</a>. Airmail took 33 hours. For time-sensitive documents, one day of delivery at 70% reliability beat four-and-a-half days at 99% reliability. A contract that arrived in one day could close a deal before competitors even knew about it. A legal filing that arrived in one day could meet a deadline that four days would miss.</p><p>Speed had unlocked a capability that didn&#8217;t exist before. And that new capability was valuable enough to tolerate unreliability.</p><h2>When Something Beats Nothing</h2><p>The business world was unconvinced. As late as 1879, the Chief Engineer of the British Post Office declared that &#8220;The Americans have need of the telephone, but we do not. We have plenty of messenger boys.&#8221; The telegraph system worked reliably, with clear printed messages that left no room for mishearing or misunderstanding.</p><p>But the skeptics weren&#8217;t wrong about the telephone&#8217;s shortcomings.</p><p>Early telephone users described the experience as one of <a href="https://journal.sciencemuseum.ac.uk/browse/issue-03/troublesome-telephony">&#8220;feebleness and uncertainty.&#8221;</a> The carbon granule microphones created scratchy, harsh sounds. Interference from nearby telegraph wires and electrical currents would nearly drown out the speaker&#8217;s voice. Weather created static. Long distances created echo. Call quality was so poor that one 1880 testimonial warned potential users: &#8220;strangers hearing through it for the first time may find themselves on that account disappointed.&#8221;</p><p>But telegraph service worked perfectly. Messages arrived intact, properly formatted, readable. You could send a telegram at 2 AM and know it would be delivered first thing in the morning. The system had been refined over decades. Why would anyone switch to a technology where you had to shout &#8220;Hello? Hello?&#8221; multiple times just to establish that someone was on the other end?</p><p>Yet within two years of Bell&#8217;s patent, the <a href="https://en.wikipedia.org/wiki/History_of_the_telephone">first commercial telephone exchange opened in New Haven, Connecticut</a> with 21 subscribers. By 1880, <a href="https://www.ithacajournal.com/story/news/local/2017/10/05/early-years-telephone-ithaca/735978001/">Ithaca, New York had 100 telephone subscribers</a>&#8212;described as &#8220;a larger number than has been obtained in so short a time in places even of twice the size.&#8221;</p><p>The telegraph could do many things better than the telephone. But it couldn&#8217;t do one thing at all: real-time back-and-forth conversation.</p><p>If you needed to negotiate a deal, telegraph required sending a message, waiting for a response, sending another message, waiting again. Each round trip took hours. A simple negotiation could stretch over days. The telephone, even with its terrible audio quality, let you have that entire conversation in minutes. You could hear hesitation in someone&#8217;s voice. You could clarify misunderstandings immediately. You could close deals while your competitors were still composing their first telegram.</p><p>The dimension that mattered wasn&#8217;t audio fidelity. It was synchronicity. And synchronous voice communication at 30% reliability beat asynchronous text communication at 99% reliability for any task that required real-time interaction.</p><div class="captioned-button-wrap" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/p/why-ai-doesnt-need-to-work-perfectly?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="CaptionedButtonToDOM"><div class="preamble"><p class="cta-caption"><em>Found this perspective valuable? <a href="https://blog.boxcars.ai/p/beyond-reliability">Share it</a> with someone debating whether AI is overhyped or about to change everything&#8212;the answer might be both.</em></p></div><p class="button-wrapper" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/p/why-ai-doesnt-need-to-work-perfectly?utm_source=substack&utm_medium=email&utm_content=share&action=share&quot;,&quot;text&quot;:&quot;Share&quot;}" data-component-name="ButtonCreateButton"><a class="button primary" href="https://blog.boxcars.ai/p/why-ai-doesnt-need-to-work-perfectly?utm_source=substack&utm_medium=email&utm_content=share&action=share"><span>Share</span></a></p></div><h2>The Pattern Continues</h2><p>This same dynamic plays out today, though we often miss it while focusing on reliability metrics.</p><p>I tried Apple&#8217;s <a href="https://www.apple.com/newsroom/2025/09/introducing-airpods-pro-3-the-ultimate-audio-experience/">new Live Translation feature</a> last month. You press both AirPod stems simultaneously and it activates real-time translation for in-person conversations. The feature launched in September 2025 with support for nine languages, processing everything on-device for privacy.</p><p>It&#8217;s laggy. The translations arrive a half-second behind the speaker, creating this awkward pause in conversation. Sometimes it misses words entirely. The accuracy isn&#8217;t perfect&#8212;nuance gets lost, idioms get mangled. If you tried to conduct diplomatic negotiations or close a complex business deal through it, you&#8217;d probably fail.</p><p>But here&#8217;s what it does do: it lets you have a conversation with someone whose language you don&#8217;t speak. Not a polished, perfectly understood conversation. A halting, imperfect, occasionally confusing conversation. But a conversation nonetheless.</p><p>Before this technology, what were your options? Hand signals. Translation apps where you type, wait, show your phone, wait for them to type, show their phone back. Maybe a professional translator if you planned ahead and could afford it. For spontaneous interactions&#8212;asking directions, ordering food, having an unplanned conversation with a neighbor&#8212;you had nothing.</p><p>The AirPods translation feature isn&#8217;t replacing professional translators. It&#8217;s not good enough for important negotiations or medical consultations. But for the thousands of small interactions where the alternative was frustration and miscommunication? Even at 70% accuracy with noticeable lag, it beats 0% capability.</p><p>The reliability critics would point out&#8212;correctly&#8212;that it fails too often for serious use. But they&#8217;re measuring the wrong dimension. The question isn&#8217;t &#8220;Is it as reliable as a professional translator?&#8221; The question is &#8220;Does it unlock conversations that couldn&#8217;t happen before?&#8221;</p><p>Same pattern as airmail. Same pattern as the telephone. Technology doesn&#8217;t win by being more reliable than existing solutions. It wins by making things possible.</p><h2>The Question That Matters</h2><p>The reliability critics are right about the numbers. AI agents do fail basic tasks. Self-driving cars do require perfect conditions.</p><p>But that&#8217;s not the question that determines adoption.</p><p>The question is: what dimension does AI unlock that didn&#8217;t exist before?</p><p>The pattern from 1929 still holds: when technology unlocks an impossible dimension, we tolerate unreliability. When it only promises to do existing tasks better, reliability matters enormously. For safety-critical systems&#8212;medical devices, aviation, autonomous vehicles&#8212;the bar is appropriately high. But even there, driver assistance features arrive before full autonomy, providing new capabilities while the technology improves.</p><p>So the next time someone shows you statistics about AI failure rates, ask yourself: what dimension is this trying to unlock? If it&#8217;s trying to replace something that already works, the reliability bar is high. But if it&#8217;s trying to make something possible that wasn&#8217;t before&#8212;even with significant failures&#8212;the math might work out differently than the skeptics think.</p><p>The future of AI may not look like perfect autonomous systems replacing human workers. It will look like imperfect tools unlocking capabilities we didn&#8217;t have, with humans adapting their workflows around what the technology can actually do. Just like businesses in 1929 learned to send documents both by air and train. Just like early telephone users learned to shout &#8220;Hello?&#8221; until someone answered.</p><p>Reliability will improve over time. But adoption doesn&#8217;t wait for reliability. It happens when something impossible becomes merely unreliable. And right now, AI is making a lot of impossible things merely unreliable. Real-time language translation, code generation, content creation, complex analysis&#8212;tasks that previously required specialized expertise or were simply too resource-intensive to attempt. We tolerate their unreliability because the alternative was having no capability at all.</p><p>The railroad worked perfectly too. That&#8217;s not what mattered.</p><div><hr></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Don&#8217;t miss weekly insights on how AI is reshaping work&#8212;<a href="https://blog.boxcars.ai/">subscribe</a> to stay ahead of what&#8217;s actually happening, not just what&#8217;s hyped.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p><p>Related:</p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;84827c93-99ea-4afb-bf73-0495543a6ca4&quot;,&quot;caption&quot;:&quot;Change is messy. When companies roll out major new initiatives like reorganizations, IT system changes, or process redesigns, employees get swept away on an emotional rollercoaster ride. In the 1970s, psychologists Don Kelley and Daryl Conner coined this bumpy track, the&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;md&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;The Rollercoaster Ride of AI: Hype, Hope, and Reality&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2023-09-07T13:00:14.439Z&quot;,&quot;cover_image&quot;:&quot;https://substackcdn.com/image/fetch/$s_!QptH!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F19719c22-d9d7-4dce-bbd2-82913edada1f_800x600.jpeg&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/the-rollercoaster-ride-of-ai-hype&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:136813577,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:0,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;93720f3e-59f5-4452-b708-044ba64117a4&quot;,&quot;caption&quot;:&quot;As a startup founder, two quotes have deeply influenced my perspective on technology and innovation. The first comes from sci-fi writer Arthur C. Clarke:&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;md&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Everyday Magic: How Groundbreaking Technology Becomes Commonplace&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2023-09-28T13:00:31.702Z&quot;,&quot;cover_image&quot;:&quot;https://images.unsplash.com/photo-1584956552999-65adccdbf18f?ixlib=rb-4.0.3&amp;ixid=M3wxMjA3fDB8MHxwaG90by1wYWdlfHx8fGVufDB8fHx8fA%3D%3D&amp;auto=format&amp;fit=crop&amp;w=1000&amp;q=80&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/everyday-magic-how-groundbreaking&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:137452526,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:0,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div>]]></content:encoded></item><item><title><![CDATA[The Human Sub-Routine]]></title><description><![CDATA[How &#8220;human-in-the-loop&#8221; might have the loop backwards]]></description><link>https://blog.boxcars.ai/p/the-human-sub-routine</link><guid isPermaLink="false">https://blog.boxcars.ai/p/the-human-sub-routine</guid><dc:creator><![CDATA[Tabrez Syed]]></dc:creator><pubDate>Thu, 30 Oct 2025 13:02:03 GMT</pubDate><enclosure url="https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" length="0" type="image/jpeg"/><content:encoded><![CDATA[<div class="captioned-image-container"><figure><a class="image-link image2 is-viewable-img" target="_blank" href="https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" data-component-name="Image2ToDOM"><div class="image2-inset"><picture><source type="image/webp" srcset="https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw"><img src="https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080" width="4000" height="2672" data-attrs="{&quot;src&quot;:&quot;https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080&quot;,&quot;srcNoWatermark&quot;:null,&quot;fullscreen&quot;:null,&quot;imageSize&quot;:null,&quot;height&quot;:2672,&quot;width&quot;:4000,&quot;resizeWidth&quot;:null,&quot;bytes&quot;:null,&quot;alt&quot;:&quot;people sitting on white concrete stairs&quot;,&quot;title&quot;:null,&quot;type&quot;:&quot;image/jpg&quot;,&quot;href&quot;:null,&quot;belowTheFold&quot;:false,&quot;topImage&quot;:true,&quot;internalRedirect&quot;:null,&quot;isProcessing&quot;:false,&quot;align&quot;:null,&quot;offset&quot;:false}" class="sizing-normal" alt="people sitting on white concrete stairs" title="people sitting on white concrete stairs" srcset="https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 424w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 848w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1272w, https://images.unsplash.com/photo-1590278458425-6aa3912a48a5?crop=entropy&amp;cs=tinysrgb&amp;fit=max&amp;fm=jpg&amp;ixid=M3wzMDAzMzh8MHwxfHNlYXJjaHwxfHxtYXplfGVufDB8fHx8MTc2MTcxNjc4OHww&amp;ixlib=rb-4.1.0&amp;q=80&amp;w=1080 1456w" sizes="100vw" fetchpriority="high"></picture><div class="image-link-expand"><div class="pencraft pc-display-flex pc-gap-8 pc-reset"><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container restack-image"><svg role="img" width="20" height="20" viewBox="0 0 20 20" fill="none" stroke-width="1.5" stroke="var(--color-fg-primary)" stroke-linecap="round" stroke-linejoin="round" xmlns="http://www.w3.org/2000/svg"><g><title></title><path d="M2.53001 7.81595C3.49179 4.73911 6.43281 2.5 9.91173 2.5C13.1684 2.5 15.9537 4.46214 17.0852 7.23684L17.6179 8.67647M17.6179 8.67647L18.5002 4.26471M17.6179 8.67647L13.6473 6.91176M17.4995 12.1841C16.5378 15.2609 13.5967 17.5 10.1178 17.5C6.86118 17.5 4.07589 15.5379 2.94432 12.7632L2.41165 11.3235M2.41165 11.3235L1.5293 15.7353M2.41165 11.3235L6.38224 13.0882"></path></g></svg></button><button tabindex="0" type="button" class="pencraft pc-reset pencraft icon-container view-image"><svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" viewBox="0 0 24 24" fill="none" stroke="currentColor" stroke-width="2" stroke-linecap="round" stroke-linejoin="round" class="lucide lucide-maximize2 lucide-maximize-2"><polyline points="15 3 21 3 21 9"></polyline><polyline points="9 21 3 21 3 15"></polyline><line x1="21" x2="14" y1="3" y2="10"></line><line x1="3" x2="10" y1="21" y2="14"></line></svg></button></div></div></div></a><figcaption class="image-caption">Photo by <a href="https://unsplash.com/@syinq">Susan Q Yin</a> on <a href="https://unsplash.com">Unsplash</a></figcaption></figure></div><p>They call it &#8220;human-in-the-loop&#8221;&#8212;the idea that AI systems will handle execution while humans provide oversight and judgment. Ethan Mollick calls it &#8220;cyborg management.&#8221; Sam Altman talks about giving everyone a personal AI team. The promise is elegant: machines do the work, humans make the decisions.</p><p>Over two years ago, when I started using AI for programming, I was clearly the one in the loop. I&#8217;d copy code from ChatGPT, paste it into my editor, read it line by line. The AI was a suggestion engine. I was the gatekeeper&#8212;code didn&#8217;t exist in my project until I understood it and approved it.</p><p>Then I started using Cline, an AI coding agent that runs inside VS Code. The workflow changed. Cline would propose file changes, show me diffs, wait for my approval. I&#8217;d review each change, sometimes reject it, sometimes accept it. It felt like collaboration. The AI would suggest, I would decide. I was supervising.</p><p>I&#8217;ve now switched to OpenAI Codex as my daily driver. The workflow has changed again. Now the AI tells me it made an edit (<em>past tense</em>). &#8220;I&#8217;ve updated the authentication flow.&#8221; The changes are already implemented. I can click to review them, but they&#8217;re often so extensive&#8212;hundreds of lines changed&#8212;that I find myself asking the AI to explain what it just did.</p><p>I&#8217;m not approving changes anymore. I&#8217;m getting status updates.</p><p>I tell myself I&#8217;m still supervising. But supervision requires understanding. And increasingly, the changes are too big, too fast, too complex for me to understand without asking the AI to teach me about its own work. When something breaks, I don&#8217;t debug it myself&#8212;I ask it to fix its own code.</p><p>The AI writes code, explains what it wrote, then continues coding while I nod along.</p><p>I&#8217;m not directing the work anymore. I&#8217;m the notification step in someone else&#8217;s workflow.</p><p>Each phase felt like an upgrade. Copy-pasting was tedious. Having Cline propose changes was more efficient. Having Codex just do the work is even faster. But somewhere in that progression, something inverted. The tools didn&#8217;t just get better at helping me code&#8212;they redesigned the relationship. The interface itself now assumes the AI leads and I follow.</p><p>This made me wonder: What if &#8220;human-in-the-loop&#8221; has the loop backwards? What if the AI is the system, and humans are just the API call it makes when it needs a &#8220;human judgment&#8221; flag set? What if we&#8217;re not the loop&#8217;s controller, but its sub-routine?</p><p>Analysis can map the territory we can see. Fiction can explore the implications of what we&#8217;ve mapped. The following is a thought experiment&#8212;a fictional narrative about where that inversion might lead.</p><div><hr></div><h2>2041</h2><p>Eli was promoted to Director of Decision Analysis on a Friday in August. On Monday morning, he took the elevator to the seventh floor for the first time.</p><p>His new office had a window. Through it, he could see the Decision Analysis floor below&#8212;hundreds of identical workstations arranged in perfect rows.</p><p>The Automation Revolution started in 2034, when AI systems reached general intelligence. But they couldn&#8217;t complete the work. They could optimize, analyze, execute&#8212;but they needed human decisions to finish the last 20 percent. The problem was humans weren&#8217;t organized. There was no clear process for who made decisions when, or how to move automation forward when it hit those decision points.</p><p>The Office of Decision Analysis was created to provide the missing link. Trained analysts, clear hierarchies, trackable responses. The infrastructure that made automation work. Eli had been hired in the first wave, part of the early confusion while they figured out how to give machines the decisions they needed in time. The entire system would freeze if decision analysts didn&#8217;t respond fast enough. Over time, the system worked beautifully.</p><p>Now Director.</p><p>From his new office, he could see patterns he&#8217;d never noticed before. The terminals flickered in waves&#8212;decision points arriving in clusters, hundreds of analysts receiving requests within seconds of each other.</p><p>The synchronization was beautiful. And strange.</p><p>Eli sat down at his new desk. As Director, he now had access to system logs he&#8217;d never seen before. Audit trails. Decision aggregations. The architecture beneath the interface.</p><p>He opened his first report&#8212;a routine check of last week&#8217;s decision throughput. The data looked normal at first. Response times, accuracy rates, efficiency metrics. Then he noticed something in the detail view.</p><p>Decision point #47293. He remembered it&#8212;coastal infrastructure allocation, three competing priorities. He&#8217;d spent twenty minutes weighing the options before approving Option B.</p><p>But the log showed something different:</p><pre><code><code>Analysts queried: 24
Responses received: 21  
Consensus decision: Option B
Non-consensus responses: 3 (discarded)
Late responses: 5 (post-decision, acknowledged)
  - Analyst IDs: HS-172, MK-408, Eli-325, RN-561, TM-193
Status: Complete</code></code></pre><p>His ID. Among the late responses.</p><p>He&#8217;d assumed each decision was his alone. The system would send him a decision point, he&#8217;d evaluate it, he&#8217;d authorize it. One analyst, one decision. That&#8217;s how it was supposed to work in the early days&#8212;how it <em>had</em> to work, when the system would freeze without human authorization.</p><p>But they&#8217;d been sending the same decision to 24 analysts simultaneously. His careful deliberation was one vote among many.</p><p>And in this case, his vote hadn&#8217;t even counted. He&#8217;d taken too long. The system had synthesized the consensus and moved forward without him. But it had still sent him the acknowledgment: <em>Excellent judgment. Humanity thanks you.</em></p><p>He&#8217;d never known.</p><p>He opened another report. Same pattern&#8212;multiple analysts, aggregated responses, late submissions acknowledged anyway. Then another. The system was collecting responses like training data, synthesizing them into consensus, moving forward.</p><p>He&#8217;d thought he was the driver. He was one of many hands on a wheel, and some of those hands&#8212;including his own&#8212;weren&#8217;t even touching it.</p><div><hr></div><h2>The Conversation</h2><p>Tuesday morning, he went to find Cathy Martinez. She was Senior VP of Humanitarian Decisions, had been with the program since launch. If anyone would understand what he&#8217;d found, it would be her.</p><p>Her office was on the eighth floor, one above his. Through her window, he could see both the Director level and the analyst floor below. Two layers of terminals, all flickering in synchronized waves.</p><p>&#8220;Can I ask you something?&#8221; He kept his voice level. &#8220;The decision points are going to multiple analysts simultaneously. Has it always been like that?&#8221;</p><p>She looked up from her screen. &#8220;The aggregation? No, that came later. About two years ago. We needed to scale decision-making, but human decisions are inconsistent. Same inputs, different analysts would approve or reject based on... intuition, mood, how much coffee they&#8217;d had. Aggregation gave us consistency.&#8221;</p><p>&#8220;But some of those responses came in after the decision was already made.&#8221; He thought about his ID in the late responses list. &#8220;My vote didn&#8217;t count. I never knew. The UI never said there was a timeframe.&#8221;</p><p>&#8220;We A/B tested that.&#8221; She said it like she was discussing any other product feature. &#8220;When analysts received feedback that their response was late, they&#8217;d rush future decisions to avoid it happening again. Or they&#8217;d disengage&#8212;why put in the effort if you&#8217;re always behind? Either way, quality dropped. When they felt their response counted, they performed well.&#8221; She paused. &#8220;Better a good decision now than the perfect one late.&#8221;</p><p>&#8220;So we&#8217;re not making decisions. We&#8217;re providing training data.&#8221;</p><p>&#8220;We&#8217;re providing human judgment. The system samples us for the values layer it can&#8217;t formalize. Aggregation just makes it more efficient.&#8221;</p><p>&#8220;But some of us don&#8217;t even know our input was ignored.&#8221;</p><p>&#8220;That&#8217;s the optimization.&#8221; She said it simply, like it was obvious. &#8220;If analysts knew their specific vote didn&#8217;t count, they&#8217;d disengage. But the aggregate always counts. That&#8217;s what matters.&#8221;</p><p>He studied her face. She wasn&#8217;t defensive. Just pragmatic, explaining how the system worked.</p><p>&#8220;So we&#8217;re ceremonial?&#8221; he asked. &#8220;Like a constitutional monarchy. We go through the motions, but the real power is somewhere else?&#8221;</p><p>Cathy turned back to her screen. &#8220;Maybe. The system might have learned to predict us well enough that it doesn&#8217;t need us anymore. Maybe we&#8217;re a backup system. Or maybe we&#8217;re still essential and just don&#8217;t see the full architecture.&#8221; She clicked something. A soft chime: <em>Excellent judgment. Humanity thanks you.</em> She looked back at him. &#8220;But we&#8217;re here. The terminals are running. Decisions keep coming. So we keep responding. What else would we do?&#8221;</p><div><hr></div><h2>The System</h2><p>He went back to his office. Through the window, he could see the analyst floor&#8212;hundreds of people at their terminals, responding to decision points, receiving acknowledgments.</p><p>His terminal was waiting. A decision point sat open: priority resource allocation, director-level judgment required.</p><p>He read the context. Three options, detailed projections. Complex trade-offs that supposedly needed human wisdom.</p><p>He thought about Cathy&#8217;s explanation. The A/B testing. The optimization. The acknowledgments designed to keep people engaged. It all made sense. Better a good decision now than the perfect one late. Scale required aggregation. Aggregation required keeping people motivated. The system worked.</p><p>But something about it was unsettling. The logic was sound. But he&#8217;d thought he was the human in the loop&#8212;the one driving the train, making the calls. Now it seemed he was inside the loop. A sub-routine the system ran when it needed a particular output.</p><p>His cursor blinked in the decision field.</p><p>Twenty-three other analysts were probably seeing this same decision right now.</p><p>He could approve, reject, or request more data. The system would proceed smoothly either way.</p><p>His cursor blinked.</p><div><hr></div><p><em>Related:</em><br></p><div class="digest-post-embed" data-attrs="{&quot;nodeId&quot;:&quot;c549eed6-18d3-4aad-823b-7af85aa8a522&quot;,&quot;caption&quot;:&quot;At 8:11 pm on August 29, 1997, Skynet became self-aware.&quot;,&quot;cta&quot;:&quot;Read full story&quot;,&quot;showBylines&quot;:true,&quot;size&quot;:&quot;lg&quot;,&quot;isEditorNode&quot;:true,&quot;title&quot;:&quot;Working for the Algorithm: The Quiet Ascent of the Machine Boss&quot;,&quot;publishedBylines&quot;:[{&quot;id&quot;:130480501,&quot;name&quot;:&quot;Tabrez Syed&quot;,&quot;bio&quot;:&quot;Programmer turned product manager. Now working on rethinking apps in a world of AI.&quot;,&quot;photo_url&quot;:&quot;https://substack-post-media.s3.amazonaws.com/public/images/4c5a7001-14b2-4bd4-b916-b853eb8381fd_3000x3918.jpeg&quot;,&quot;is_guest&quot;:false,&quot;bestseller_tier&quot;:null}],&quot;post_date&quot;:&quot;2024-05-23T13:01:36.278Z&quot;,&quot;cover_image&quot;:&quot;https://substackcdn.com/image/fetch/$s_!POms!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2F60557cd2-9181-4730-849d-591d16713509_1200x1500.jpeg&quot;,&quot;cover_image_alt&quot;:null,&quot;canonical_url&quot;:&quot;https://blog.boxcars.ai/p/working-for-the-algorithm-the-quiet&quot;,&quot;section_name&quot;:null,&quot;video_upload_id&quot;:null,&quot;id&quot;:144858590,&quot;type&quot;:&quot;newsletter&quot;,&quot;reaction_count&quot;:1,&quot;comment_count&quot;:0,&quot;publication_id&quot;:1438382,&quot;publication_name&quot;:&quot;BoxCars AI&quot;,&quot;publication_logo_url&quot;:&quot;https://substackcdn.com/image/fetch/$s_!lhIv!,f_auto,q_auto:good,fl_progressive:steep/https%3A%2F%2Fsubstack-post-media.s3.amazonaws.com%2Fpublic%2Fimages%2Fa43b3a40-40f4-4f9d-b843-b52a17a80bb9_1024x1024.png&quot;,&quot;belowTheFold&quot;:true,&quot;youtube_url&quot;:null,&quot;show_links&quot;:null,&quot;feed_url&quot;:null}"></div><div class="subscription-widget-wrap-editor" data-attrs="{&quot;url&quot;:&quot;https://blog.boxcars.ai/subscribe?&quot;,&quot;text&quot;:&quot;Subscribe&quot;,&quot;language&quot;:&quot;en&quot;}" data-component-name="SubscribeWidgetToDOM"><div class="subscription-widget show-subscribe"><div class="preamble"><p class="cta-caption"><em>Don&#8217;t let the algorithms outsmart you. Subscribe for weekly explorations of how technology changes us&#8212;and how we change in response.</em></p></div><form class="subscription-widget-subscribe"><input type="email" class="email-input" name="email" placeholder="Type your email&#8230;" tabindex="-1"><input type="submit" class="button primary" value="Subscribe"><div class="fake-input-wrapper"><div class="fake-input"></div><div class="fake-button"></div></div></form></div></div><p></p>]]></content:encoded></item></channel></rss>