<?xml version="1.0" encoding="UTF-8"?>
<!--
  RSS 2.0 feed of blog posts.
  Layout: one <channel> carrying feed-level metadata, followed by one <item>
  per post, listed newest first by <pubDate>.
  Each item's <guid> is the post URL itself (identical to its <link>), so it
  is marked as a permalink explicitly rather than relying on the RSS default.
-->
<rss version="2.0">
  <channel>
    <!-- Feed-level metadata -->
    <title>Sai Anirudh Siddi — Writing</title>
    <link>https://www.saianirudh.blog/blog</link>
    <description>Sai Anirudh Siddi — AI Engineer working on ML systems, LLMs, model evaluation and SaaS. Projects, writing, and experience.</description>
    <language>en-us</language>

    <!-- Posts, newest first -->
    <item>
      <title>Probing medical LLMs for overconfidence</title>
      <link>https://www.saianirudh.blog/blog/probing-medical-llms-for-overconfidence</link>
      <guid isPermaLink="true">https://www.saianirudh.blog/blog/probing-medical-llms-for-overconfidence</guid>
      <description>Training a persona-vector probe that reads overconfidence straight off a medical LLM's activations — and the two changes that moved AUROC from chance to 0.88.</description>
      <pubDate>Thu, 28 May 2026 00:00:00 GMT</pubDate>
    </item>

    <item>
      <title>From 0.50 to 0.88 AUROC with activation normalization</title>
      <link>https://www.saianirudh.blog/blog/auroc-from-half-to-088</link>
      <guid isPermaLink="true">https://www.saianirudh.blog/blog/auroc-from-half-to-088</guid>
      <description>A short note on why normalizing residual-stream activations before a linear probe is the single highest-leverage change for behavioral detection in LLMs.</description>
      <pubDate>Mon, 04 May 2026 00:00:00 GMT</pubDate>
    </item>

    <item>
      <title>Monitoring interpretability in production</title>
      <link>https://www.saianirudh.blog/blog/monitoring-interpretability-in-production</link>
      <guid isPermaLink="true">https://www.saianirudh.blog/blog/monitoring-interpretability-in-production</guid>
      <description>Interpretability isn't just an offline research tool — wiring feature activations into Arize Phoenix and Sentry turns it into a live safety signal.</description>
      <pubDate>Sun, 12 Apr 2026 00:00:00 GMT</pubDate>
    </item>

    <item>
      <title>What I learned building ExoSeeker</title>
      <link>https://www.saianirudh.blog/blog/what-i-learned-building-exoseeker</link>
      <guid isPermaLink="true">https://www.saianirudh.blog/blog/what-i-learned-building-exoseeker</guid>
      <description>Lessons from building an AI exoplanet-detection pipeline on NASA Kepler data that hit &gt;90% accuracy and won Best Use of NASA Data.</description>
      <pubDate>Wed, 15 Jan 2025 00:00:00 GMT</pubDate>
    </item>
  </channel>
</rss>