<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:dc="http://purl.org/dc/elements/1.1/" version="2.0">
  <channel>
    <title>InfoQ - Distributed Programming - News</title>
    <link>https://www.infoq.com</link>
    <description>InfoQ Distributed Programming News feed</description>
    <item>
      <title>Microsoft Releases DeepSpeed-FastGen for High-Throughput Text Generation</title>
      <link>https://www.infoq.com/news/2023/11/microsoft-releases-dsfastgen/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Distributed+Programming-news</link>
      <description>&lt;img src="https://res.infoq.com/news/2023/11/microsoft-releases-dsfastgen/en/headerimage/header%281%29-1699209225367.jpg"/&gt;&lt;p&gt;Microsoft has announced the alpha release of DeepSpeed-FastGen, a system designed to improve the deployment and serving of large language models (LLMs). DeepSpeed-FastGen is the synergistic composition of DeepSpeed-MII and DeepSpeed-Inference. DeepSpeed-FastGen is based on the Dynamic SplitFuse technique. The system currently supports several model architectures.&lt;/p&gt; &lt;i&gt;By Andrew Hoblitzell&lt;/i&gt;</description>
      <category>Microsoft</category>
      <category>Distributed Programming</category>
      <category>Deep Learning</category>
      <category>GPU</category>
      <category>Machine Learning</category>
      <category>Development</category>
      <category>AI, ML &amp; Data Engineering</category>
      <category>news</category>
      <pubDate>Tue, 07 Nov 2023 17:56:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2023/11/microsoft-releases-dsfastgen/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Distributed+Programming-news</guid>
      <dc:creator>Andrew Hoblitzell</dc:creator>
      <dc:date>2023-11-07T17:56:00Z</dc:date>
      <dc:identifier>/news/2023/11/microsoft-releases-dsfastgen/en</dc:identifier>
    </item>
  </channel>
</rss>
