It looks like this is a web page, not a feed. I looked for a feed associated with this page, but couldn't find one. Please enter the address of your feed to validate.

Source: http://www.sebastianraschka.com/rss_feed.xml

  1. <!DOCTYPE html>
  2. <html lang="en">
  3.  
  4.  <head>
  5.  <meta charset="utf-8">
  6.  <meta name="viewport" content="width=device-width, initial-scale=1" />
  7.  <meta http-equiv="X-UA-Compatible" content="IE=edge">
  8.  
  9.  <meta name="author" content="Sebastian Raschka">
  10.  <meta property="og:title" content="
  11.    Sebastian Raschka
  12.  ">
  13.  
  14.  <meta property="og:description" content="
  15.    I'm an LLM Research Engineer with over a decade of experience in artificial intelligence. My work bridges academia and industry, with roles including senior staff at an AI company and a statistics professor. My expertise lies in LLM research and the development of high-performance AI systems, with a deep focus on practical, code-driven implementations.
  16.  
  17.  ">
  18.  
  19.  <meta property="og:url" content="https://sebastianraschka.com/" />
  20.  <meta property="og:site_name" content="Sebastian Raschka, PhD" />
  21.  <meta property="og:locale" content="en_US" />
  22.  <meta property="og:type" content="article" />
  23.  <meta property="article:published_time" content="" />
  24.  
  25.  
  26.  
  27.    <meta property="og:image" content="https://sebastianraschka.com/images/logos/hero.jpg" />
  28.  
  29.  
  30.  <meta name="twitter:site" content="@rasbt" />
  31.  <meta name="twitter:creator" content="@rasbt" />
  32.  <meta name="twitter:title" content="Sebastian Raschka" />
  33.  <meta name="twitter:description" content="
  34.    I'm an LLM Research Engineer with over a decade of experience in artificial intelligence. My work bridges academia and industry, with roles including senior staff at an AI company and a statistics professor. My expertise lies in LLM research and the development of high-performance AI systems, with a deep focus on practical, code-driven implementations.
  35.  
  36.  " />
  37.  
  38.  
  39.    <meta name="twitter:card" content="summary_large_image">
  40.    <meta name="twitter:image" content="https://sebastianraschka.com/images/logos/hero.jpg">
  41.  
  42.  
  43.  <title>Sebastian Raschka</title>
  44.  <meta name="description" content="I'm an LLM Research Engineer with over a decade of experience in artificial intelligence. My work bridges academia and industry, with roles including senior staff at an AI company and a statistics professor. My expertise lies in LLM research and the development of high-performance AI systems, with a deep focus on practical, code-driven implementations.
  45. ">
  46.  <link rel="stylesheet" href="/css/combined_direct_no_sass.css">
  47.  <link rel="stylesheet" href="/css/fork-awesome.min.css">
  48.  <meta property='og:title' content="Sebastian Raschka">
  49. <meta property="og:type" content="article">
  50. <meta property="og:url" content="https://sebastianraschka.com/">
  51.  
  52.  
  53.  <meta property="og:image" content="https://sebastianraschka.com/images/logos/hero.jpg">
  54.  
  55.  
  56. <meta property="og:description" content="">
  57. <meta property="og:site_name" content="Sebastian Raschka, PhD">
  58. <meta property="og:locale" content="en_US">
  59.  
  60.  
  61. <meta property="fb:admins" content="">
  62. <meta property="fb:app_id" content="">
  63.  
  64.  
  65.  
  66.    <link rel="canonical" href="https://sebastianraschka.com/">
  67.  
  68.  
  69.  <link rel="icon" type="image/png" sizes="32x32" href="/images/favicons/favicon-32x32.png">
  70.  <link rel="icon" type="image/png" sizes="16x16" href="/images/favicons/favicon-16x16.png">
  71.  <link rel="manifest" href="/site.webmanifest">
  72.  <link rel="mask-icon" href="/images/favicons/safari-pinned-tab.svg" color="#5bbad5">
  73.  <meta name="msapplication-TileColor" content="#ffc40d">
  74.  <meta name="theme-color" content="#ffffff">
  75.  
  76.  
  77.  <body>
  78.    <img src="/images/logos/ahead-of-ai-icon.png" alt="Ahead of AI logo" style="display: none;">
  79.  
  80. <header class="site-header">
  81.  
  82.      <div class="site-title" style="text-decoration: none; margin-top: 2em;">
  83.        <a href="/"><span style="color:black">Sebastian</span> <span style="color:#c5050c">Raschka</span> </a>
  84.        <a href="https://x.com/rasbt"><img src="/images/logos/twitter-bw.jpg" height="20" style="padding-left:20px;" alt="Twitter/X icon"></a>
  85.        <!--<a href="https://threads.net/@sebastianraschka"><img src="/images/logos/threads-logo-alt-small.png" height="20" style="padding-left:5px;" alt="Threads icon"></a>-->
  86.        <a href="https://www.linkedin.com/in/sebastianraschka/"><img src="/images/logos/linkedin-bw.jpg" height="20" style="padding-left:5px;" alt="LinkedIn Icon"></a>
  87.        <a href="https://github.com/rasbt"><img src="/images/logos/github-bw.jpg" height="20" style="padding-left:5px;" alt="GitHub icon"></a>
  88.  
  89.      </div>
  90.  
  91.  
  92.  
  93.     <!--  <div style="width:100%;height:50;float:left;margin-bottom:10px;">
  94.        &nbsp;<a href="https://twitter.com/rasbt"><img src="/images/logos/twitter-bw.jpg" height="20"></a>-->
  95.        <!-- &nbsp;<a href="https://www.buymeacoffee.com/rasbt"><img src="/images/logos/coffee-bw.jpg" height="20"></a>-->
  96.        <!--&nbsp;<a href="https://mastodon.social/@SebRaschka"><img src="/images/logos/mastodon-bw.jpg" height="20"></a>-->
  97.  
  98.     <!-- </div>-->
  99.  
  100.  
  101.  <div class="wrapper">
  102.  
  103.    <nav class="site-nav">
  104.      <a href="#" class="menu-icon">
  105.        <svg viewBox="0 0 18 15">
  106.          <path fill="#424242" d="M18,1.484c0,0.82-0.665,1.484-1.484,1.484H1.484C0.665,2.969,0,2.304,0,1.484l0,0C0,0.665,0.665,0,1.484,0 h15.031C17.335,0,18,0.665,18,1.484L18,1.484z"/>
  107.          <path fill="#424242" d="M18,7.516C18,8.335,17.335,9,16.516,9H1.484C0.665,9,0,8.335,0,7.516l0,0c0-0.82,0.665-1.484,1.484-1.484 h15.031C17.335,6.031,18,6.696,18,7.516L18,7.516z"/>
  108.          <path fill="#424242" d="M18,13.516C18,14.335,17.335,15,16.516,15H1.484C0.665,15,0,14.335,0,13.516l0,0 c0-0.82,0.665-1.484,1.484-1.484h15.031C17.335,12.031,18,12.696,18,13.516L18,13.516z"/>
  109.        </svg>
  110.      </a>
  111.  
  112.  
  113.  
  114.  
  115.      <div class="trigger">
  116.  
  117.  
  118.  
  119.        <!--<script type="text/javascript">
  120.          var total_images = 2;
  121.          var random_number = Math.floor((Math.random()*total_images));
  122.          var random_img = new Array();
  123.          random_img[0] = '<a href="https://twitter.com/rasbt"><img src="/images/logos/twitter-1.jpg" height="20"></a>';
  124.          random_img[1] = '<a href="https://linkedin.com/in/sebastianraschka"><img src="/images/logos/linkedin-1.jpg" height="20"></a>';
  125.          document.write(random_img[random_number]);
  126.          </script>-->
  127.  
  128.        <span style="padding-left:0px;margin-left:0px;"></span>
  129.        <a class="page-link" href="https://magazine.sebastianraschka.com"><span style="color:#c5050c;"><img src="/images/logos/ahead-of-ai-icon.png" alt="Ahead of AI Logo" height="20"> Blog</span></a>
  130.        <!--<a class="page-link" href="/blog/index.html">Blog</a>-->
  131.        <a class="page-link" href="/books">Books</a>
  132.        <!--<a class="page-link" href="/newsletter">AI Newsletter</a>-->
  133.        <a class="page-link" href="/teaching">Courses</a>
  134.        <a class="page-link" href="https://github.com/rasbt/LLMs-from-scratch">LLMs From Scratch</a>
  135.        <!--<a class="page-link" href="/publications">Research</a>-->
  136.        <a class="page-link" href="/elsewhere">Talks</a>
  137.        <a class="page-link" href="/contact">Contact</a>
  138.        <a class="page-link" href="/resources">More</a>
  139.  
  140.  
  141.      </div>
  142.  
  143.  
  144.    </nav>
  145.  
  146.  
  147.  </div>
  148.  
  149. </header>
  150.  
  151.  
  152.    <div class="page-content">
  153.      <div class="wrapper">
  154.        <div style="display: flex; align-items: center; justify-content: center; flex-wrap: wrap; max-width: 800px; margin: 40px auto; gap: 30px;">
  155.    <div style="flex: 1; min-width: 300px; text-align: left;">
  156.        <h1 style="font-size: 1.8em; font-weight: 600; color: #222; margin-bottom: 20px;">
  157.            Hello, I'm Sebastian Raschka, PhD
  158.        </h1>
  159.        <p style="font-size: 1.1em; line-height: 1.8; color: #555; margin-bottom: 20px;">
  160.            I'm an LLM Research Engineer with over a decade of experience in artificial intelligence. My work bridges academia and industry, with roles including senior staff at an AI company and a statistics professor.
  161.        </p>
  162.        <p style="font-size: 1.1em; line-height: 1.8; color: #555; margin-bottom: 20px;">
  163.            My expertise lies in LLM research and the development of high-performance AI systems, with a deep focus on practical, code-driven implementations.
  164.            (For my most up-to-date CV details, please visit my <a href="https://www.linkedin.com/in/sebastianraschka">LinkedIn profile</a>.)
  165.        </p>
  166.    </div>
  167.    <div style="flex: 0 0 200px; text-align: center;">
  168.        <picture>
  169.            <source type="image/webp" srcset="/images/logos/photo-2021-08-25_compressed.webp">
  170.            <source type="image/jpeg" srcset="/images/logos/photo-2021-08-25_compressed.jpg">
  171.            <img src="/images/logos/photo-2021-08-25_compressed.jpg" alt="Sebastian Raschka Profile Picture" style="width: 200px; height: 200px; object-fit: cover; object-position: 100% 10%; border-radius: 50%; box-shadow: 0 4px 10px rgba(0,0,0,0.1);">
  172.        </picture>
  173.    </div>
  174. </div>
  175.  
  176.  
  177. <!-- Subscribe Section -->
  178. <div class="rss" style="display: flex; align-items: center; justify-content: center; width: 96%; margin: 20px auto; max-width: 800px;">
  179.    <a href="/rss_feed.xml" style="display: inline-flex; align-items: center; margin-right: 20px;">
  180.        <i class="fa fa-rss fa-1x" style="padding-right: 5px;"></i>
  181.        <span>RSS Feed (Blog and Notes)</span>
  182.    </a>
  183.    <a class="page-link" href="https://magazine.sebastianraschka.com/subscribe" style="display: inline-flex; align-items: center;">
  184.        <img src="/images/logos/ahead-of-ai-icon.png" alt="Ahead of AI Logo" height="20" style="padding-right: 5px;">
  185.        <span>Subscribe via Email (AI Magazine)</span>
  186.    </a>
  187. </div>
  188.  
  189. <div style="height: 50px;"></div>
  190.  
  191. <!-- Blog Entries Section -->
  192. <div style="max-width: 800px; margin: 30px auto;">
  193.    <blockquote>
  194.        <!-- Content about Sebastian -->
  195.    </blockquote>
  196.  
  197.    <div class="post">
  198.        <header class="post-header">
  199.            <h1 class="post-title">Recent Notes and Blog Entries</h1>
  200.        </header>
  201.  
  202.        <div style="margin-bottom: 45px; text-align: center;">
  203.            See <a href="/blog/">Blog and Notes Archive</a> for all entries.
  204.        </div>
  205.  
  206.        <article class="post-content posts-by-year">
  207.            
  208.            
  209.                
  210.  
  211.                <div class="post-entry">
  212.                    
  213.                        <div class="post-hero-image">
  214.                            <img src="/images/blog/2025/from-gpt-2-to-gpt-oss/hero.jpg" alt="From GPT-2 to gpt-oss: Analyzing the Architectural Advances">
  215.                        </div>
  216.                    
  217.                    <div class="post-details">
  218.                        <h2 class="post-title">
  219.                            <a href="/blog/2025/from-gpt-2-to-gpt-oss.html">From GPT-2 to gpt-oss: Analyzing the Architectural Advances</a>
  220.                        </h2>
  221.                        <p class="post-date">Aug 9, 2025</p>
  222.                        <p class="post-description">OpenAI just released their new open-weight LLMs this week: gpt-oss-120b and gpt-oss-20b, their first open-weight models since GPT-2 in 2019. And yes, thanks to some clever optimizations, they can run locally. I spent the past few days reading through the code and technical reports to summarize the most interesting details.</p>
  223.                    </div>
  224.                </div>
  225.  
  226.                
  227.            
  228.                
  229.  
  230.                <div class="post-entry">
  231.                    
  232.                        <div class="post-hero-image">
  233.                            <img src="/images/blog/2025/the-big-llm-architecture-comparison/hero.jpg" alt="The Big LLM Architecture Comparison">
  234.                        </div>
  235.                    
  236.                    <div class="post-details">
  237.                        <h2 class="post-title">
  238.                            <a href="/blog/2025/the-big-llm-architecture-comparison.html">The Big LLM Architecture Comparison</a>
  239.                        </h2>
  240.                        <p class="post-date">Jul 19, 2025</p>
  241.                        <p class="post-description">It has been seven years since the original GPT architecture was developed. At first glance, looking back at GPT-2 (2019) and forward to DeepSeek-V3 and Llama 4 (2024-2025), one might be surprised at how structurally similar these models still are. Comparing LLMs to determine the key ingredients that contribute to their good (or not-so-good) performance is notoriously challenging: datasets, training techniques, and hyperparameters vary widely and are often not well documented. However, I think that there is still a lot of value in examining the structural changes of the architectures themselves to see what LLM developers are up to in 2025.</p>
  242.                    </div>
  243.                </div>
  244.  
  245.                
  246.            
  247.                
  248.  
  249.                <div class="post-entry">
  250.                    
  251.                        <div class="post-hero-image">
  252.                            <img src="/images/blog/2025/llm-research-papers-the-2025-list-january-to-june/hero.jpeg" alt="LLM Research Papers: The 2025 List (January to June)">
  253.                        </div>
  254.                    
  255.                    <div class="post-details">
  256.                        <h2 class="post-title">
  257.                            <a href="/blog/2025/llm-research-papers-the-2025-list-january-to-june.html">LLM Research Papers: The 2025 List (January to June)</a>
  258.                        </h2>
  259.                        <p class="post-date">Jul 1, 2025</p>
  260.                        <p class="post-description">The latest in LLM research with a hand-curated, topic-organized list of over 200 research papers from 2025.</p>
  261.                    </div>
  262.                </div>
  263.  
  264.                
  265.            
  266.                
  267.  
  268.                <div class="post-entry">
  269.                    
  270.                        <div class="post-hero-image">
  271.                            <img src="/images/blog/2025/coding-the-kv-cache-in-llms/hero.jpg" alt="Understanding and Coding the KV Cache in LLMs from Scratch">
  272.                        </div>
  273.                    
  274.                    <div class="post-details">
  275.                        <h2 class="post-title">
  276.                            <a href="/blog/2025/coding-the-kv-cache-in-llms.html">Understanding and Coding the KV Cache in LLMs from Scratch</a>
  277.                        </h2>
  278.                        <p class="post-date">Jun 17, 2025</p>
  279.                        <p class="post-description">KV caches are one of the most critical techniques for compute-efficient LLM inference in production. This article explains how they work conceptually and in code with a from-scratch, human-readable implementation.</p>
  280.                    </div>
  281.                </div>
  282.  
  283.                
  284.            
  285.                
  286.  
  287.                <div class="post-entry">
  288.                    
  289.                        <div class="post-hero-image">
  290.                            <img src="/images/blog/2025/coding-llms-from-the-ground-up-a-complete-course/hero.jpg" alt="Coding LLMs from the Ground Up: A Complete Course">
  291.                        </div>
  292.                    
  293.                    <div class="post-details">
  294.                        <h2 class="post-title">
  295.                            <a href="/blog/2025/coding-llms-from-the-ground-up-a-complete-course.html">Coding LLMs from the Ground Up: A Complete Course</a>
  296.                        </h2>
  297.                        <p class="post-date">May 10, 2025</p>
  298.                        <p class="post-description">Why build an LLM from scratch? It's probably the best and most efficient way to learn how LLMs really work. Plus, many readers have told me they had a lot of fun doing it.</p>
  299.                    </div>
  300.                </div>
  301.  
  302.                
  303.            
  304.                
  305.                    
  306.        </article>
  307.    </div>
  308. </div>
  309.  
  310. <!-- Styles -->
  311. <style>
  312.    .post-entry {
  313.        display: flex;
  314.        align-items: flex-start;
  315.        margin-bottom: 20px;
  316.        border-bottom: 1px solid #ddd;
  317.        padding-bottom: 20px;
  318.    }
  319.  
  320.    .post-hero-image {
  321.        flex: 0 0 120px;
  322.        margin-right: 20px;
  323.    }
  324.  
  325.    .post-hero-image img {
  326.        width: 100%;
  327.        height: auto;
  328.    }
  329.  
  330.    .post-details {
  331.        flex: 1;
  332.    }
  333.  
  334.    .post-title {
  335.        margin: 0;
  336.        font-size: 1.5em;
  337.        color: #333;
  338.    }
  339.  
  340.    .post-title a {
  341.        color: #333;
  342.        text-decoration: none;
  343.    }
  344.  
  345.    .post-title a:hover {
  346.        text-decoration: underline;
  347.        color: #0056b3;
  348.    }
  349.  
  350.    .post-date {
  351.        color: #666;
  352.        font-size: 0.9em;
  353.        margin: -4px 0;
  354.    }
  355.  
  356.    .post-description {
  357.        margin: 0;
  358.    }
  359.  
  360.    h1.post-title {
  361.        text-align: center;
  362.    }
  363.  
  364.    h2.post-title, h2.post-title a {
  365.        all: unset;
  366.        display: block;
  367.        font-size: 1.0em;
  368.        color: #333;
  369.        text-decoration: none;
  370.    }
  371.  
  372.    h2.post-title a:hover {
  373.        color: #0056b3;
  374.        text-decoration: underline;
  375.    }
  376.  
  377.    a.anchorjs-link {
  378.        display: none !important;
  379.    }
  380. </style>
  381.  
  382.      </div>
  383.    </div>
  384.  
  385.    <footer class="site-footer">
  386.  
  387.  <div class="wrapper">
  388.  
  389.  
  390.  
  391.    <div class="footer-col-wrapper">
  392.  
  393.  
  394.    <div class="footer-col  social-col">
  395.  
  396.  
  397.      
  398.      <a href="https://magazine.sebastianraschka.com"><span><i class="fa fa-rss fa-2x"></i></span> </a>
  399.      
  400.  
  401.      
  402.          <a href="/contact"><span><i class="fa fa-envelope fa-2x"></i></span> </a>
  403.      
  404.  
  405.      
  406.        <a href="https://twitter.com/rasbt"> <span><i class="fa fa-twitter fa-2x"></i></span> </a>
  407.      
  408.  
  409.      
  410.            <a href="https://youtube.com/c/SebastianRaschka"><span><i class="fa fa-youtube fa-2x"></i></span> </a>
  411.      
  412.  
  413.      
  414.            <a href="https://github.com/rasbt"><span><i class="fa fa-github fa-2x"></i> </span></a>
  415.      
  416.  
  417.      
  418.          <a href="https://scholar.google.com/citations?user=X4RCC0IAAAAJ&amp;hl=en"><span><i class="fa fa-google fa-2x"></i> </span></a>
  419.      
  420.  
  421.      
  422.          <a href="https://linkedin.com/in/sebastianraschka"><span><i class="fa fa-linkedin fa-2x"></i> </span></a>
  423.      
  424.  
  425.  
  426.  </div>
  427.  
  428.    <div class="footer-col  copyright-col">
  429.      <p>&copy; 2013-2025 Sebastian Raschka</p>
  430.    </div>
  431.  
  432.  
  433.  
  434.  </div>
  435. </div>
  436.  
  437. <!-- Google tag (gtag.js) -->
  438. <script async src="https://www.googletagmanager.com/gtag/js?id=G-BYQXBRPK81"></script>
  439. <script>
  440.  window.dataLayer = window.dataLayer || [];
  441.  function gtag(){dataLayer.push(arguments);}
  442.  gtag('js', new Date());
  443.  
  444.  gtag('config', 'G-BYQXBRPK81');
  445. </script>
  446. </footer>
  447.  
  448.  
  449.  
  450.  <script src="/js/anchor.min.js" type="text/javascript"></script>
  451.  <script>
  452.    var selector = 'h2, h3, h4, h5, h6';
  453.    /*
  454.    anchors.options = {
  455.      icon: '#',
  456.      visible: 'always',
  457.      placement: 'left',
  458.      class: 'bb-anchor'
  459.    }
  460.    */
  461.    anchors.add(selector);
  462.  </script>
  463.  
  464. </body>
  465. </html>
  466.  
Copyright © 2002-9 Sam Ruby, Mark Pilgrim, Joseph Walton, and Phil Ringnalda