<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
<channel>
  <title>Tom F - Writing</title>
  <link>https://tomtomtech.net/writing</link>
  <description>Notes on retrieval, evals, agent infrastructure, and shipping systems that keep working.</description>
  <language>en-us</language>
  <atom:link href="https://tomtomtech.net/rss.xml" rel="self" type="application/rss+xml" />
  <item>
    <title>A refusal-eval rubric for grounded document QA</title>
    <link>https://tomtomtech.net/writing/refusal-eval-harness</link>
    <guid isPermaLink="true">https://tomtomtech.net/writing/refusal-eval-harness</guid>
    <description>Four buckets, one table, and why &quot;correct&quot; is the least interesting score in the set</description>
    <pubDate>Sun, 05 Apr 2026 00:00:00 GMT</pubDate>
    <category>ai</category>
    <category>rag</category>
    <category>evals</category>
    <category>refusal</category>
  </item>
  <item>
    <title>System-design notes from shipping hosted LLM workloads</title>
    <link>https://tomtomtech.net/writing/shipping-hosted-llms</link>
    <guid isPermaLink="true">https://tomtomtech.net/writing/shipping-hosted-llms</guid>
    <description>Prompt caching, tool-use loops, structured output, and the failure modes that show up in regulated deployments</description>
    <pubDate>Sun, 22 Mar 2026 00:00:00 GMT</pubDate>
    <category>ai</category>
    <category>system-design</category>
    <category>tool-use</category>
  </item>
  <item>
    <title>Notes on designing a protocol-native agent eval substrate</title>
    <link>https://tomtomtech.net/writing/agent-eval-harness</link>
    <guid isPermaLink="true">https://tomtomtech.net/writing/agent-eval-harness</guid>
    <description>Why the wire protocol is the right place to draw the eval boundary</description>
    <pubDate>Sat, 28 Feb 2026 00:00:00 GMT</pubDate>
    <category>ai</category>
    <category>agents</category>
    <category>a2a</category>
    <category>evals</category>
  </item>
  <item>
    <title>What it actually takes to run unattended for a year</title>
    <link>https://tomtomtech.net/writing/unattended-for-a-year</link>
    <guid isPermaLink="true">https://tomtomtech.net/writing/unattended-for-a-year</guid>
    <description>The single design constraint that reshapes every other decision</description>
    <pubDate>Fri, 20 Feb 2026 00:00:00 GMT</pubDate>
    <category>systems</category>
    <category>reliability</category>
    <category>ops</category>
  </item>
  <item>
    <title>Rust, Go, and the distribution-vs-guarantees matrix</title>
    <link>https://tomtomtech.net/writing/rust-go-distribution-matrix</link>
    <guid isPermaLink="true">https://tomtomtech.net/writing/rust-go-distribution-matrix</guid>
    <description>When Rust is the right choice, when Go is, and why the honest answer is &quot;it depends on which problem you&apos;re solving&quot;</description>
    <pubDate>Sun, 18 Jan 2026 00:00:00 GMT</pubDate>
    <category>rust</category>
    <category>go</category>
    <category>systems</category>
    <category>language-choice</category>
  </item>
</channel>
</rss>
