<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed for the "AI Search" tag listing on www.jamieede.com.
  The generator element below names Hugo as the producer.
  NOTE(review): this looks like build output; hand edits would presumably be
  overwritten on the next site build. Confirm, and change the feed template instead.
-->
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata: title, the HTML page this feed mirrors, and a summary line. -->
    <title>AI Search on Jamie Ede</title>
    <link>https://www.jamieede.com/tags/ai-search/</link>
    <description>Recent content in AI Search on Jamie Ede</description>
    <generator>Hugo</generator>
    <language>en-us</language>
    <!-- Same timestamp as the pubDate of the single item below. -->
    <lastBuildDate>Fri, 05 Jun 2026 11:00:00 +0000</lastBuildDate>
    <!-- Self reference: the URL of this feed document, using the atom prefix bound on the root element. -->
    <atom:link href="https://www.jamieede.com/tags/ai-search/index.xml" rel="self" type="application/rss+xml" />
    <!-- The only entry in this feed. -->
    <item>
      <title>The local OCR that scored best, and let the chatbot show the diagrams</title>
      <link>https://www.jamieede.com/posts/docling-rapidocr-inline-figures-service-manual-rag/</link>
      <pubDate>Fri, 05 Jun 2026 11:00:00 +0000</pubDate>
      <!-- guid repeats the link URL and carries no isPermaLink attribute, which RSS 2.0 treats as isPermaLink="true". -->
      <guid>https://www.jamieede.com/posts/docling-rapidocr-inline-figures-service-manual-rag/</guid>
      <!--
        The description is entity-escaped HTML: one paragraph holding a link to an
        earlier post and one strong-emphasised phrase. The numeric reference after the
        closing anchor tag (hex A) is a line feed and is part of the text payload.
      -->
      <description>&lt;p&gt;In the &lt;a href=&#34;https://www.jamieede.com/posts/measuring-ocr-accuracy-1994-service-manual-rag/&#34; &gt;last post&lt;/a&gt;&#xA; I built a strict exact-match test for the OCR behind a 1994 Yamaha XV250 Virago manual chatbot and scored four local pipelines against 100 hand-verified values. The live corpus (Docling running EasyOCR) scored 61 percent; the best of the four was &lt;strong&gt;Docling + RapidOCR at 85 percent&lt;/strong&gt;, and it got there doing genuine OCR on the page pixels, with nothing leaving the machine and no per-page API bill.&lt;/p&gt;</description>
    </item>
  </channel>
</rss>
