<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:dc="http://purl.org/dc/elements/1.1/" version="2.0">
  <channel>
    <title>InfoQ - Mobile - News</title>
    <link>https://www.infoq.com</link>
    <description>InfoQ Mobile News feed</description>
    <item>
      <title>Google LiteRT-LM Speeds Up Local Inference Up to 2.2x With Gemma 4 Multi-Token Prediction</title>
      <link>https://www.infoq.com/news/2026/06/google-litertlm-gemma4/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Mobile-news</link>
      <description>&lt;img src="https://res.infoq.com/news/2026/06/google-litertlm-gemma4/en/headerimage/google-litert-ml-gemma4-1780649451174.jpeg"/&gt;&lt;p&gt;LiteRT-LM brings native support for Gemma 4 Multi-Token Prediction (MTP) drafters, enabling up to 2.2x faster inference. The framework is expanding beyond Kotlin and C++, adding support for new Swift and JavaScript APIs.&lt;/p&gt; &lt;i&gt;By Sergio De Simone&lt;/i&gt;</description>
      <category>TensorFlow</category>
      <category>Large language models</category>
      <category>Google</category>
      <category>Gemma</category>
      <category>Edge Computing</category>
      <category>Mobile</category>
      <category>Agents</category>
      <category>AI, ML &amp; Data Engineering</category>
      <category>Development</category>
      <category>news</category>
      <pubDate>Fri, 05 Jun 2026 09:00:00 GMT</pubDate>
      <guid>https://www.infoq.com/news/2026/06/google-litertlm-gemma4/?utm_campaign=infoq_content&amp;utm_source=infoq&amp;utm_medium=feed&amp;utm_term=Mobile-news</guid>
      <dc:creator>Sergio De Simone</dc:creator>
      <dc:date>2026-06-05T09:00:00Z</dc:date>
      <dc:identifier>/news/2026/06/google-litertlm-gemma4/en</dc:identifier>
    </item>
  </channel>
</rss>
