<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata for the /tags/vllm/ listing feed. -->
    <title>Vllm on Amit Agarwal Linux Blog</title>
    <!-- NOTE(review): this link, the atom:link href and the item link below are
         site-relative paths. RSS 2.0 readers and feed validators expect absolute
         URLs here. Presumably the site base URL was empty when the feed was
         built; confirm the generator configuration and regenerate. -->
    <link>/tags/vllm/</link>
    <description>Recent content in Vllm on Amit Agarwal Linux Blog</description>
    <generator>Hugo -- gohugo.io</generator>
    <language>en</language>
    <lastBuildDate>Thu, 25 Dec 2025 00:00:00 +0530</lastBuildDate>
    <!-- Self-reference to this feed document (rel="self"). -->
    <atom:link href="/tags/vllm/index.xml" rel="self" type="application/rss+xml" />
    <item>
      <title>Run a Local LLM API Server with vLLM (OpenAI-Compatible, Fast, and Simple)</title>
      <link>/2025/12/25/2025-12-25-local_vllm/</link>
      <pubDate>Thu, 25 Dec 2025 00:00:00 +0530</pubDate>
      <!-- isPermaLink defaults to "true", which promises an absolute URL. The
           value is a relative path, so it is declared as an opaque identifier.
           The guid text itself is unchanged, so readers that already stored it
           still recognise this item. -->
      <guid isPermaLink="false">/2025/12/25/2025-12-25-local_vllm/</guid>
      <!-- The description carries entity-escaped HTML (the code tags). -->
      <description>Step-by-step: create a uv virtualenv, install vLLM with the right torch backend, and launch &lt;code&gt;vllm serve&lt;/code&gt; to get an OpenAI-compatible local API endpoint.</description>
    </item>
  </channel>
</rss>
