<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0">
  <channel>
    <title>PyPI recent updates for turbo-attn</title>
    <link>https://pypi.org/project/turbo-attn/</link>
    <description>Recent updates to the Python Package Index for turbo-attn</description>
    <language>en</language>    <item>
      <title>0.6.4</title>
      <link>https://pypi.org/project/turbo-attn/0.6.4/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Sat, 13 Jun 2026 14:11:48 GMT</pubDate>
    </item>    <item>
      <title>0.6.3</title>
      <link>https://pypi.org/project/turbo-attn/0.6.3/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Sat, 13 Jun 2026 00:11:03 GMT</pubDate>
    </item>    <item>
      <title>0.6.2</title>
      <link>https://pypi.org/project/turbo-attn/0.6.2/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Fri, 12 Jun 2026 21:54:02 GMT</pubDate>
    </item>    <item>
      <title>0.6.1</title>
      <link>https://pypi.org/project/turbo-attn/0.6.1/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Fri, 12 Jun 2026 19:43:12 GMT</pubDate>
    </item>    <item>
      <title>0.6.0</title>
      <link>https://pypi.org/project/turbo-attn/0.6.0/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Fri, 12 Jun 2026 15:19:31 GMT</pubDate>
    </item>    <item>
      <title>0.5.1</title>
      <link>https://pypi.org/project/turbo-attn/0.5.1/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Fri, 12 Jun 2026 15:15:25 GMT</pubDate>
    </item>    <item>
      <title>0.5.0</title>
      <link>https://pypi.org/project/turbo-attn/0.5.0/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Thu, 11 Jun 2026 15:03:08 GMT</pubDate>
    </item>    <item>
      <title>0.4.1</title>
      <link>https://pypi.org/project/turbo-attn/0.4.1/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Thu, 11 Jun 2026 05:09:05 GMT</pubDate>
    </item>    <item>
      <title>0.4.0</title>
      <link>https://pypi.org/project/turbo-attn/0.4.0/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Wed, 10 Jun 2026 21:20:08 GMT</pubDate>
    </item>    <item>
      <title>0.3.2</title>
      <link>https://pypi.org/project/turbo-attn/0.3.2/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Wed, 10 Jun 2026 20:43:15 GMT</pubDate>
    </item>    <item>
      <title>0.3.0</title>
      <link>https://pypi.org/project/turbo-attn/0.3.0/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Wed, 10 Jun 2026 19:09:17 GMT</pubDate>
    </item>    <item>
      <title>0.3.1</title>
      <link>https://pypi.org/project/turbo-attn/0.3.1/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Wed, 10 Jun 2026 19:09:14 GMT</pubDate>
    </item>    <item>
      <title>0.2.0</title>
      <link>https://pypi.org/project/turbo-attn/0.2.0/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Tue, 02 Jun 2026 19:33:14 GMT</pubDate>
    </item>    <item>
      <title>0.1.2</title>
      <link>https://pypi.org/project/turbo-attn/0.1.2/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Thu, 30 Apr 2026 20:20:38 GMT</pubDate>
    </item>    <item>
      <title>0.1.1</title>
      <link>https://pypi.org/project/turbo-attn/0.1.1/</link>
      <description>Optimized CUDAgraph-enabled kernels and attention backend for vLLM, SGLang and more based on TurboQuant near-lossless KV cache compression. SOTA performance with Gemma 4, Qwen 3.6 and other modern LLMs.</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Thu, 30 Apr 2026 19:49:21 GMT</pubDate>
    </item>    <item>
      <title>0.1.0</title>
      <link>https://pypi.org/project/turbo-attn/0.1.0/</link>
      <description>Productionized TurboQuant KV cache compression for vLLM and SGLang (imported as `tqkv`)</description>
<author>dmitri.evseev@arbi.city</author>      <pubDate>Thu, 30 Apr 2026 19:41:29 GMT</pubDate>
    </item>  </channel>
</rss>