<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:dc="http://purl.org/dc/elements/1.1/">
  <channel>
    <!-- Channel-level metadata: the feed's title, a one-line summary, and the site link it points to. -->
    <title>Forem: Stephanie</title>
    <description>The latest articles on Forem by Stephanie (@stephaniespanjian).</description>
    <link>https://forem.com/stephaniespanjian</link>
    <!-- Channel image: the URL requests a 90x90 cover-fit rendition; title and link repeat the channel's own title and link. -->
    <image>
      <url>https://media2.dev.to/dynamic/image/width=90,height=90,fit=cover,gravity=auto,format=auto/https:%2F%2Fdev-to-uploads.s3.amazonaws.com%2Fuploads%2Fuser%2Fprofile_image%2F3793081%2Fa0002f58-017e-418f-b195-8196b9a361ad.JPG</url>
      <title>Forem: Stephanie</title>
      <link>https://forem.com/stephaniespanjian</link>
    </image>
    <!-- Atom rel="self" link: the address of this feed document itself, typed as RSS. -->
    <atom:link rel="self" type="application/rss+xml" href="https://forem.com/feed/stephaniespanjian"/>
    <!-- Language code for the channel content. -->
    <language>en</language>
    <item>
      <!-- Entry headline, author (Dublin Core creator), and publication timestamp. -->
      <title>RAG on a Budget: How I Replaced a $360/Month OpenSearch Cluster with S3 and In-Memory Search</title>
      <dc:creator>Stephanie</dc:creator>
      <pubDate>Thu, 26 Feb 2026 00:32:31 +0000</pubDate>
      <!-- The guid carries the same URL as the link. -->
      <link>https://forem.com/stephaniespanjian/rag-on-a-budget-how-i-replaced-a-360month-opensearch-cluster-with-s3-and-in-memory-search-5eek</link>
      <guid>https://forem.com/stephaniespanjian/rag-on-a-budget-how-i-replaced-a-360month-opensearch-cluster-with-s3-and-in-memory-search-5eek</guid>
      <!-- HTML body of the entry, held in a CDATA section so the markup reads literally.
           Lines inside are deliberately not indented: whitespace in this element is part of the text. -->
      <description><![CDATA[<p>I shelved a project in March 2025 because it cost $360/month to run.</p>

<p>I rebuilt it in January 2026 for $1.12/month.</p>

<p>Same functionality. Better architecture. No vector database.</p>

<p>It's a RAG pipeline — API Gateway → Lambda → Amazon Bedrock → S3 embeddings → in-memory cosine similarity search. It lives on my site and answers questions about my experience and work history in real time, grounded in structured data I built and curated myself.</p>

<p>The interesting parts: <br>
— Why I killed OpenSearch after less than a week <br>
— How in-memory search outperformed a network call at this scale <br>
— The Anthropic/Bedrock access issue I still haven't fully resolved (Llama works fine) <br>
— Why I handcrafted every knowledge base chunk instead of automating it<br>
Full write-up: <a href="https://stephaniespanjian.com/blog/rag-cost-reduction-replaced-opensearch-s3-in-memory-search" rel="noopener noreferrer">https://stephaniespanjian.com/blog/rag-cost-reduction-replaced-opensearch-s3-in-memory-search</a></p>

]]></description>
      <!-- Topic tags, one category element per tag. -->
      <category>ai</category>
      <category>aws</category>
      <category>bedrock</category>
      <category>systemdesign</category>
    </item>
  </channel>
</rss>
