<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
<channel>
  <!-- Channel-level metadata: feed title, site link, short description, language, and last build time. -->
  <title>Zubnet AI News — Infrastructure</title>
  <link>https://zubnet.ai/news/</link>
  <description>AI infrastructure news by Sarah Chen.</description>
  <language>en</language>
  <lastBuildDate>Tue, 07 Apr 2026 09:31:28 +0000</lastBuildDate>
  <!-- Atom self link (rel="self"): the URL of this feed document itself. -->
  <atom:link href="https://zubnet.ai/news/feed/infra.xml" rel="self" type="application/rss+xml"/>
  <!-- Channel image; its title and link repeat the channel's own title and link. -->
  <image>
    <url>https://zubnet.ai/sarah.png</url>
    <title>Zubnet AI News — Infrastructure</title>
    <link>https://zubnet.ai/news/</link>
  </image>
  <item>
    <title>Meta Donates Helion to PyTorch Foundation, Taking Aim at CUDA's Kernel Lock-in</title>
    <link>https://zubnet.ai/news/meta-donates-helion-pytorch-foundation-taking-aim-cudas-kernel-lock-in/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/meta-donates-helion-pytorch-foundation-taking-aim-cudas-kernel-lock-in/</guid>
    <!-- NOTE(review): this summary arrived truncated, ending in a stray backslash (presumably cut at an escaped quote by the generator; confirm). Restore the full text from the article. -->
    <description>The Python DSL promises…</description>
    <pubDate>Tue, 07 Apr 2026 07:05:34 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/d6e58d2716.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>PyTorch Adds CuteDSL Backend, Betting on Python Over C++ for GPU Kernels</title>
    <link>https://zubnet.ai/news/pytorch-adds-cutedsl-backend-betting-python-over-c-gpu-kernels/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/pytorch-adds-cutedsl-backend-betting-python-over-c-gpu-kernels/</guid>
    <description>Meta's TorchInductor now supports NVIDIA's CuteDSL as a fourth backend for matrix multiplications, signaling a shift toward Python-based GPU kernel development.</description>
    <pubDate>Tue, 07 Apr 2026 07:00:52 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/c043be24d2.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>ExecuTorch Joins PyTorch Core, Challenging Mobile AI Deployment Status Quo</title>
    <link>https://zubnet.ai/news/executorch-joins-pytorch-core-challenging-mobile-ai-deployment-status/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/executorch-joins-pytorch-core-challenging-mobile-ai-deployment-status/</guid>
    <description>Meta's on-device inference runtime becomes official PyTorch project, potentially reshaping how developers deploy AI on phones and edge devices.</description>
    <pubDate>Tue, 07 Apr 2026 06:35:35 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/d34b0bdfe0.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Samsung's AI Memory Gold Rush Reveals the Real Infrastructure Winners</title>
    <link>https://zubnet.ai/news/samsungs-ai-memory-gold-rush-reveals-real-infrastructure-winners/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/samsungs-ai-memory-gold-rush-reveals-real-infrastructure-winners/</guid>
    <description>Record profit forecasts signal memory chips, not flashy models, are where the real AI money flows.</description>
    <pubDate>Tue, 07 Apr 2026 05:20:32 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/31d73f72a8.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Cursor's Warp Decode Claims 1.8x GPU Speedup—But Where's the Proof?</title>
    <link>https://zubnet.ai/news/cursors-warp-decode-claims-18x-gpu-speedupbut-wheres-proof/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/cursors-warp-decode-claims-18x-gpu-speedupbut-wheres-proof/</guid>
    <description>Cursor says their new warp decode technique eliminates MoE overhead on B200 GPUs, but with zero technical details or independent verification.</description>
    <pubDate>Tue, 07 Apr 2026 05:15:30 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/4d5b02b1a0.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>NVIDIA's Transformer Engine Tutorial Shows FP8's Real Implementation Hurdles</title>
    <link>https://zubnet.ai/news/nvidias-transformer-engine-tutorial-shows-fp8s-real-implementation/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/nvidias-transformer-engine-tutorial-shows-fp8s-real-implementation/</guid>
    <description>A new guide reveals the complexity of actually deploying NVIDIA's mixed-precision training—and why most developers need fallback plans.</description>
    <pubDate>Mon, 06 Apr 2026 23:25:40 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/7500ac7041.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Supply Chain Attack Through LiteLLM Hits Meta's AI Training Pipeline</title>
    <link>https://zubnet.ai/news/supply-chain-attack-through-litellm-hits-metas-ai-training-pipeline/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/supply-chain-attack-through-litellm-hits-metas-ai-training-pipeline/</guid>
    <description>A 40-minute window of poisoned packages exposed how fragile the vendor layer supporting AI development really is.</description>
    <pubDate>Mon, 06 Apr 2026 18:50:34 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/7722f44319.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Resolight tackles AI's real bottleneck: data movement, not compute</title>
    <link>https://zubnet.ai/news/resolight-tackles-ais-real-bottleneck-data-movement-compute/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/resolight-tackles-ais-real-bottleneck-data-movement-compute/</guid>
    <description>While everyone obsesses over GPUs, this startup says the real constraint in AI systems is interconnect bandwidth.</description>
    <pubDate>Mon, 06 Apr 2026 16:25:28 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/3b41ae3ae7.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Intel Bets $1B+ on Chip Packaging as AI Giants Shop for Custom Silicon</title>
    <link>https://zubnet.ai/news/intel-bets-1b-chip-packaging-ai-giants-shop-custom-silicon/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/intel-bets-1b-chip-packaging-ai-giants-shop-custom-silicon/</guid>
    <description>While everyone obsesses over chip design, Intel is quietly cornering the market on putting those chips together.</description>
    <pubDate>Mon, 06 Apr 2026 09:05:36 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/adc65d9b0c.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>LLM Agents Now Write CUDA Code: AutoKernel Tackles GPU Optimization</title>
    <link>https://zubnet.ai/news/llm-agents-now-write-cuda-code-autokernel-tackles-gpu-optimization/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/llm-agents-now-write-cuda-code-autokernel-tackles-gpu-optimization/</guid>
    <description>RightNow AI's AutoKernel uses LLM agents to automatically optimize GPU kernels overnight—no CUDA expertise required.</description>
    <pubDate>Mon, 06 Apr 2026 08:25:36 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/ae96b7667a.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>GPU Failures Expose AI Infrastructure's Dirty Secret</title>
    <link>https://zubnet.ai/news/gpu-failures-expose-ai-infrastructures-dirty-secret/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/gpu-failures-expose-ai-infrastructures-dirty-secret/</guid>
    <description>AI clusters push hardware beyond design limits where failures aren't bugs—they're features.</description>
    <pubDate>Mon, 06 Apr 2026 06:45:31 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/30d7a3a472.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>NVIDIA Gives Away GPU Orchestration Code That Actually Matters</title>
    <link>https://zubnet.ai/news/nvidia-gives-away-gpu-orchestration-code-actually-matters/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/nvidia-gives-away-gpu-orchestration-code-actually-matters/</guid>
    <description>The Dynamic Resource Allocation driver donation to Kubernetes could finally solve GPU sharing nightmares at scale.</description>
    <pubDate>Sat, 04 Apr 2026 17:00:16 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/caee047499.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Trump's China tariffs are killing the AI data center boom he demanded</title>
    <link>https://zubnet.ai/news/trumps-china-tariffs-killing-ai-data-center-boom-he-demanded/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/trumps-china-tariffs-killing-ai-data-center-boom-he-demanded/</guid>
    <description>Nearly half of planned US data centers face delays as tariffs block Chinese power equipment imports.</description>
    <pubDate>Fri, 03 Apr 2026 21:41:53 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/689756e34d.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>AI inference hits the context memory wall, not compute</title>
    <link>https://zubnet.ai/news/ai-inference-hits-context-memory-wall-compute/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/ai-inference-hits-context-memory-wall-compute/</guid>
    <description>Long AI sessions need massive context storage, but NAND flash wasn't built for this workload.</description>
    <pubDate>Fri, 03 Apr 2026 18:30:37 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/a15791b24c.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>AI Cloud Bills Are Exploding and FinOps Can't Save You</title>
    <link>https://zubnet.ai/news/ai-cloud-bills-exploding-finops-cant-save-you/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/ai-cloud-bills-exploding-finops-cant-save-you/</guid>
    <description>55% of enterprises see no AI benefits yet, but cloud costs keep climbing. Traditional cost management won't work here.</description>
    <pubDate>Fri, 03 Apr 2026 16:20:33 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/29c9a5936b.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>NVIDIA's Model Optimizer Gets Real-World Tutorial, But Complexity Remains</title>
    <link>https://zubnet.ai/news/nvidias-model-optimizer-gets-real-world-tutorial-complexity-remains/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/nvidias-model-optimizer-gets-real-world-tutorial-complexity-remains/</guid>
    <description>A new end-to-end guide shows how to actually use NVIDIA's optimization tools in practice, revealing both promise and friction.</description>
    <pubDate>Fri, 03 Apr 2026 07:50:40 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/29ef9c0076.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>GPU Rowhammer attacks can now fully compromise CPU systems</title>
    <link>https://zubnet.ai/news/gpu-rowhammer-attacks-now-fully-compromise-cpu-systems/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/gpu-rowhammer-attacks-now-fully-compromise-cpu-systems/</guid>
    <description>Two research teams showed how malicious users can gain root control of shared GPU servers by bit-flipping GDDR memory.</description>
    <pubDate>Thu, 02 Apr 2026 20:56:55 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/72aca98f91.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Google Gemini API Gets Flex/Priority Tiers for Cost vs Speed Tradeoffs</title>
    <link>https://zubnet.ai/news/google-gemini-api-gets-flexpriority-tiers-cost-vs-speed-tradeoffs/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/google-gemini-api-gets-flexpriority-tiers-cost-vs-speed-tradeoffs/</guid>
    <description>New service tiers let developers pay 50% less for background tasks or premium for critical workloads, all through sync endpoints.</description>
    <pubDate>Thu, 02 Apr 2026 19:15:30 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/b9151f445e.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Google's New Texas Data Center Exposes AI's Dirty Power Problem</title>
    <link>https://zubnet.ai/news/googles-new-texas-data-center-exposes-ais-dirty-power-problem/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/googles-new-texas-data-center-exposes-ais-dirty-power-problem/</guid>
    <description>Despite climate commitments, Google's backing a Texas facility that will emit 4.5M tons of CO2 yearly—more than most coal plants.</description>
    <pubDate>Thu, 02 Apr 2026 18:30:35 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/85ee62d3cb.jpg" length="0" type="image/jpeg"/>
  </item>
  <item>
    <title>Half of 2026 Data Centers May Never Open</title>
    <link>https://zubnet.ai/news/half-2026-data-centers-may-never-open/</link>
    <guid isPermaLink="true">https://zubnet.ai/news/half-2026-data-centers-may-never-open/</guid>
    <description>Supply chain bottlenecks are crushing AI infrastructure plans. Only a third of promised capacity is actually under construction.</description>
    <pubDate>Thu, 02 Apr 2026 15:20:31 +0000</pubDate>
    <author>sarah@zubnet.ai (Sarah Chen)</author>
    <category>Infrastructure</category>
    <!-- RSS 2.0 requires a length (in bytes) on enclosure; 0 marks the size as unknown. -->
    <enclosure url="https://zubnet.ai/news/images/1972062d83.jpg" length="0" type="image/jpeg"/>
  </item>
</channel>
</rss>
