<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0">
  <channel>
    <!-- Channel-level metadata: the feed's display title, the URL this feed
         describes (a /category/ path on sesamedisk.com), a one-sentence
         summary, and the content language code. The <item> entries in this
         channel appear newest-first by <pubDate>. -->
    <title>Local AI Inference - Sesame Disk</title>
    <link>https://sesamedisk.com/category/local-ai-inference/</link>
    <description>Articles about Local AI Inference from Sesame Disk.</description>
    <language>en-us</language>
    <!-- Entry for the local inference engine comparison article (the URL slug
         names llama.cpp, vLLM, SGLang and Ollama).
         <guid> repeats the <link> URL and carries no isPermaLink attribute,
         which RSS 2.0 treats as isPermaLink="true".
         The description text ends mid-sentence with an ellipsis character.
         The ampersand in the first category is escaped as &amp;, as XML
         requires. -->
    <item>
      <title>In 2026, the Decision Among Local Inference Engines Comes Down to One Question</title>
      <link>https://sesamedisk.com/llamacpp-vs-vllm-vs-sglang-vs-ollama-2026/</link>
      <description>Discover the key factors influencing local AI inference engine choices in 2026, including performance, security, and architectural considerations for…</description>
      <pubDate>Fri, 19 Jun 2026 11:55:08 +0000</pubDate>
      <guid>https://sesamedisk.com/llamacpp-vs-vllm-vs-sglang-vs-ollama-2026/</guid>
      <category>AI &amp; Emerging Technology</category>
      <category>Local AI Inference</category>
      <category>Open Source Infrastructure</category>
    </item>
    <!-- Entry for the GPU vs. ASIC hardware comparison article.
         <guid> repeats the <link> URL and carries no isPermaLink attribute,
         which RSS 2.0 treats as isPermaLink="true".
         The description text ends mid-sentence with an ellipsis character.
         <pubDate> uses the RFC 822 date form with a +0000 offset. -->
    <item>
      <title>2026 Hardware Showdown: GPU and ASIC Performance for LLM Inference</title>
      <link>https://sesamedisk.com/llm-inference-hardware-2026-comparison/</link>
      <description>Compare 2026 performance claims of GPU and ASIC platforms for LLM inference, analyzing throughput, power, and deployment implications to inform your…</description>
      <pubDate>Tue, 09 Jun 2026 00:02:45 +0000</pubDate>
      <guid>https://sesamedisk.com/llm-inference-hardware-2026-comparison/</guid>
      <category>Local AI Inference</category>
      <category>Semiconductor Innovation</category>
      <category>Software Development</category>
    </item>
    <!-- Entry for the overview article on local inference engines.
         Unlike the other entries in this feed, the description here is two
         complete sentences with no trailing ellipsis.
         <guid> repeats the <link> URL and carries no isPermaLink attribute,
         which RSS 2.0 treats as isPermaLink="true".
         NOTE(review): the phrase "best local inference engine 2026" reads
         awkwardly; presumably it mirrors the article's own summary text, so
         confirm at the source before rewording. -->
    <item>
      <title>Top Local AI Inference Engines in 2026: Features and Use Cases</title>
      <link>https://sesamedisk.com/local-inference-engines-2026-comparison/</link>
      <description>Compare top local inference engines for LLMs in 2026: Ollama, llama.cpp, vLLM, TGI, and SGLang. Find the best local inference engine 2026 for your hardware and workload.</description>
      <pubDate>Wed, 20 May 2026 00:03:15 +0000</pubDate>
      <guid>https://sesamedisk.com/local-inference-engines-2026-comparison/</guid>
      <category>AI &amp; Emerging Technology</category>
      <category>Local AI Inference</category>
    </item>
    <!-- Entry for the quantization formats article (GGUF, AWQ, GPTQ, FP8).
         It is filed under four categories, one <category> element each.
         <guid> repeats the <link> URL and carries no isPermaLink attribute,
         which RSS 2.0 treats as isPermaLink="true".
         The description text ends mid-sentence with an ellipsis character. -->
    <item>
      <title>Quantization Techniques for AI Inference in 2026: GGUF, AWQ, GPTQ, and FP8</title>
      <link>https://sesamedisk.com/quantization-techniques-ai-inference-2026/</link>
      <description>Explore the latest in quantization techniques for local AI inference in 2026, comparing GGUF, AWQ, GPTQ, and FP8 formats to optimize model performance and…</description>
      <pubDate>Thu, 14 May 2026 09:19:36 +0000</pubDate>
      <guid>https://sesamedisk.com/quantization-techniques-ai-inference-2026/</guid>
      <category>AI &amp; Emerging Technology</category>
      <category>Local AI Inference</category>
      <category>Storage</category>
      <category>Tech Markets</category>
    </item>
  </channel>
</rss>