<?xml version="1.0" encoding="UTF-8"?>
<!--
  RSS 2.0 feed for the 2xStudio Engineering Blog.

  Namespace prefixes declared on the root:
    content : declared, but no element below currently uses it.
    atom    : used for the feed's self-referencing link.
    dc      : Dublin Core; carries each item's byline as a plain name.
-->
<rss version="2.0"
     xmlns:content="http://purl.org/rss/1.0/modules/content/"
     xmlns:atom="http://www.w3.org/2005/Atom"
     xmlns:dc="http://purl.org/dc/elements/1.1/">
  <channel>
    <!-- Channel metadata. -->
    <title>2xStudio Engineering Blog</title>
    <description>Engineering insights on building production AI agents, full-stack applications, and automation systems.</description>
    <link>https://www.2xstudio.in/blog</link>
    <!-- rel="self" points at the feed document itself, not at the blog page. -->
    <atom:link href="https://www.2xstudio.in/feed.xml" rel="self" type="application/rss+xml" />
    <language>en-US</language>
    <lastBuildDate>Wed, 10 Jun 2026 04:37:30 GMT</lastBuildDate>
    <!-- Channel image; its title and link repeat the channel's own title and link. -->
    <image>
      <url>https://www.2xstudio.in/og-image.png</url>
      <title>2xStudio Engineering Blog</title>
      <link>https://www.2xstudio.in/blog</link>
    </image>

    <!--
      Items. The byline uses dc:creator rather than RSS <author>, because
      RSS 2.0 defines <author> as an email address and only a name is given here.
    -->
    <item>
      <title><![CDATA[How to Evaluate Whether Your LLM Is Actually Giving the Right Answer]]></title>
      <description><![CDATA[A detailed guide to evaluating LLM outputs using exact match, semantic checks, factuality, human review, and production-ready scoring pipelines.]]></description>
      <link>https://www.2xstudio.in/blog/how-to-evaluate-llm-outputs</link>
      <!-- isPermaLink="true": the guid is the same URL as the item link. -->
      <guid isPermaLink="true">https://www.2xstudio.in/blog/how-to-evaluate-llm-outputs</guid>
      <pubDate>Tue, 26 May 2026 00:00:00 GMT</pubDate>
      <dc:creator>Sumit Kumar</dc:creator>
      <category>LLM evaluation</category>
      <category>evaluate LLM output</category>
      <category>how to evaluate language models</category>
      <category>LLM accuracy</category>
      <category>RAG evaluation</category>
      <category>LLM hallucination detection</category>
      <category>LLM as judge</category>
      <category>semantic similarity evaluation</category>
      <category>AI output quality</category>
      <category>production LLM pipeline</category>
      <category>factual correctness LLM</category>
      <category>LLM scoring metrics</category>
    </item>

    <item>
      <title><![CDATA[Building Production AI Agents: A Practical Guide]]></title>
      <description><![CDATA[Lessons from shipping multi-agent systems in production — architecture, tool-calling patterns, observability, and the failure modes that actually matter.]]></description>
      <link>https://www.2xstudio.in/blog/building-production-ai-agents</link>
      <!-- isPermaLink="true": the guid is the same URL as the item link. -->
      <guid isPermaLink="true">https://www.2xstudio.in/blog/building-production-ai-agents</guid>
      <pubDate>Wed, 20 May 2026 00:00:00 GMT</pubDate>
      <dc:creator>Sumit Kumar</dc:creator>
      <category>AI Agents</category>
      <category>Architecture</category>
      <category>LLMs</category>
      <category>Production</category>
    </item>
  </channel>
</rss>