<?xml version="1.0" encoding="UTF-8"?>
<!-- Sitemap root. Unprefixed elements belong to the sitemaps.org 0.9 namespace;
     the "news" prefix is bound to the Google News sitemap extension namespace. -->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:news="http://www.google.com/schemas/sitemap-news/0.9">
  <!-- One <url> entry per article: <loc> holds the article URL and
       <news:news> holds the news-specific metadata for that URL. -->
  <url>
    <loc>https://devtoolsfeed.com/article/time-when-more-layers-meant-worse-model-birth-of-residual/</loc>
    <news:news>
      <!-- Publication identity: display name and language code. -->
      <news:publication>
        <news:name>DevTools Feed</news:name>
        <news:language>en</news:language>
      </news:publication>
      <!-- ISO 8601 timestamp with fractional seconds and an explicit +00:00 offset. -->
      <news:publication_date>2026-05-27T19:26:10.510780+00:00</news:publication_date>
      <news:title>Beyond Vanishing Gradients: The Power of the Residual Connection</news:title>
      <!-- Comma-separated keyword list.
           NOTE(review): confirm the target crawler still reads news:keywords;
           if it does not, the generator could stop emitting it. -->
      <news:keywords>deep learning, neural networks, residual connections, transformer architecture, vanishing gradients</news:keywords>
    </news:news>
  </url>
</urlset>
