<?xml version="1.0" encoding="UTF-8"?>
<rss version="2.0"
     xmlns:media="http://search.yahoo.com/mrss/"
     xmlns:atom="http://www.w3.org/2005/Atom"
     xmlns:neowin="https://www.neowin.net/">
	<channel>
		<!-- Channel-level metadata for the "Inference" tag feed. -->
		<title>Neowin News Feed for: Inference</title>
		<link>https://www.neowin.net/news/tag/inference/</link>
		<!-- Self-reference to this feed's own URL. -->
		<atom:link href="https://www.neowin.net/news/rss/inference/" rel="self" type="application/rss+xml" />
		<description>Neowin News Feed for: Inference</description>
		<language>en-us</language>
		<generator>Neowin Ignition News</generator>
		<managingEditor>editor@neowin.net (Managing Editor)</managingEditor>
		<webMaster>developers@neowin.net (Neowin Developers)</webMaster>
		<!-- RSS 2.0 expresses ttl in minutes. -->
		<ttl>5</ttl>
		<!-- Channel image. -->
		<image>
			<title>Neowin.net</title>
			<url>https://www.neowin.net/images/pegasus/icon.png</url>
			<link>https://www.neowin.net</link>
		</image>
		        <item>
		            <!-- Article entry; link and guid hold the same article URL. -->
		            <title>Google's new method makes LLMs faster and more powerful, and cheaper too</title>
		            <link>https://www.neowin.net/news/googles-new-method-makes-llms-faster-and-more-powerful-and-cheaper-too/</link>
		            <!-- Entity-escaped HTML summary: thumbnail, teaser text and a "Read more..." link.
		                 The apostrophe is an HTML character reference escaped again for XML; keep it as written. -->
		            <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2025/08/1756531195_gemini_medium.webp" alt="" /&gt;&lt;/div&gt;Google Research has developed a new method that could make running large language models cheaper and faster. Here&amp;#039;s what it has done. &lt;a href="https://www.neowin.net/news/googles-new-method-makes-llms-faster-and-more-powerful-and-cheaper-too/"&gt;Read more...&lt;/a&gt;</description>
		            <author>Paul Hill</author>
		            <pubDate>Fri, 12 Sep 2025 14:12:01 +0000</pubDate>
		            <guid>https://www.neowin.net/news/googles-new-method-makes-llms-faster-and-more-powerful-and-cheaper-too/</guid>
		            <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2025/08/1756531195_gemini_story.webp"
		                             width="760"
		                             height="428" />
		            <!-- Site-specific extension elements from the neowin namespace. -->
		            <neowin:tags>#Google #Research #LLMs</neowin:tags>
		            <neowin:twitter>@ziks_99</neowin:twitter>
		        </item>
                <item>
                    <!-- Article entry; link and guid hold the same article URL. -->
                    <title>Nvidia announces its most powerful GPU, the Blackwell Ultra, built for training agentic AI</title>
                    <link>https://www.neowin.net/news/nvidia-announces-its-most-powerful-gpu-the-blackwell-ultra-built-for-training-agentic-ai/</link>
                    <!-- Entity-escaped HTML summary: thumbnail, teaser text and a "Read more..." link. -->
                    <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2025/05/1747646100_nvidia_grace_blackwell_medium.jpg" alt="" /&gt;&lt;/div&gt;Nvidia has announced its latest GPU, the Blackwell Ultra, made to train the next generation of AI models.  &lt;a href="https://www.neowin.net/news/nvidia-announces-its-most-powerful-gpu-the-blackwell-ultra-built-for-training-agentic-ai/"&gt;Read more...&lt;/a&gt;</description>
                    <author>Karthik Mudaliar</author>
                    <pubDate>Mon, 19 May 2025 09:28:02 +0000</pubDate>
                    <guid>https://www.neowin.net/news/nvidia-announces-its-most-powerful-gpu-the-blackwell-ultra-built-for-training-agentic-ai/</guid>
                    <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2025/05/1747646100_nvidia_grace_blackwell_story.jpg"
                                     width="760"
                                     height="428" />
                    <!-- Site-specific extension elements from the neowin namespace. -->
                    <neowin:tags>#Nvidia #Blackwell #Ultra</neowin:tags>
                    <neowin:twitter>@heykarthikm</neowin:twitter>
                </item>
                <item>
                    <!-- Article entry; link and guid hold the same article URL. -->
                    <title>Cerebras launches the world's fastest AI inference, 20X performance compared to NVIDIA</title>
                    <link>https://www.neowin.net/news/cerebras-launches-the-worlds-fastest-ai-inference-20x-performance-compared-to-nvidia/</link>
                    <!-- Entity-escaped HTML summary: thumbnail, teaser text and a "Read more..." link.
                         Apostrophes are HTML character references escaped again for XML; keep them as written. -->
                    <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2024/08/1724784526_cerebras_inference_medium.jpg" alt="" /&gt;&lt;/div&gt;Cerebras Systems launched Cerebras Inference, the world&amp;#039;s fastest AI inference solution. It&amp;#039;s 20x faster than NVIDIA&amp;#039;s solutions and offers 100x higher price-performance. &lt;a href="https://www.neowin.net/news/cerebras-launches-the-worlds-fastest-ai-inference-20x-performance-compared-to-nvidia/"&gt;Read more...&lt;/a&gt;</description>
                    <author>Pradeep Viswanathan</author>
                    <pubDate>Tue, 27 Aug 2024 19:20:01 +0000</pubDate>
                    <guid>https://www.neowin.net/news/cerebras-launches-the-worlds-fastest-ai-inference-20x-performance-compared-to-nvidia/</guid>
                    <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2024/08/1724784526_cerebras_inference_story.jpg"
                                     width="760"
                                     height="428" />
                    <!-- Site-specific extension elements from the neowin namespace. -->
                    <neowin:tags>#Cerebras #NVIDIA #AI #LLMs</neowin:tags>
                    <neowin:twitter>@pradeepviswav</neowin:twitter>
                </item>
                <item>
                    <!-- Article entry; link and guid hold the same article URL. -->
                    <title>Google is making on-device machine learning easier on Android later this year</title>
                    <link>https://www.neowin.net/news/google-is-making-on-device-machine-learning-easier-on-android-later-this-year/</link>
                    <!-- Entity-escaped HTML summary: thumbnail, teaser text and a "Read more..." link. -->
                    <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2017/11/1510041776_robot_medium.jpg" alt="" /&gt;&lt;/div&gt;Google has announced the Android ML Platform. Coming this year, it will make on-device inference easier by offering a consistent API and deeper integration with the OS without too many dependencies. &lt;a href="https://www.neowin.net/news/google-is-making-on-device-machine-learning-easier-on-android-later-this-year/"&gt;Read more...&lt;/a&gt;</description>
                    <author>Usama Jawad</author>
                    <pubDate>Fri, 09 Jul 2021 17:38:52 +0000</pubDate>
                    <guid>https://www.neowin.net/news/google-is-making-on-device-machine-learning-easier-on-android-later-this-year/</guid>
                    <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2017/11/1510041776_robot_story.jpg"
                                     width="760"
                                     height="428" />
                    <!-- Site-specific extension elements from the neowin namespace. -->
                    <neowin:tags>#AndroidMLPlatform</neowin:tags>
                    <neowin:twitter>@UsamaJawad96</neowin:twitter>
                </item>
                <item>
                    <!-- Article entry; link and guid hold the same article URL. -->
                    <title>Mipsology partners with OKI IDS to bring FPGA-accelerated ML applications to Japan</title>
                    <link>https://www.neowin.net/news/mipsology-partners-with-oki-ids-to-bring-fpga-accelerated-ml-applications-to-japan/</link>
                    <!-- Entity-escaped HTML summary: thumbnail, teaser text and a "Read more..." link.
                         The apostrophe is an HTML character reference escaped again for XML; keep it as written. -->
                    <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2020/11/1604981411_cert-bae_medium.jpg" alt="" /&gt;&lt;/div&gt;Japanese software development firm OKI IDS will be combining its expertise with Mipsology&amp;#039;s field-programmable gate arrays to bring high-quality machine learning applications to Japan. &lt;a href="https://www.neowin.net/news/mipsology-partners-with-oki-ids-to-bring-fpga-accelerated-ml-applications-to-japan/"&gt;Read more...&lt;/a&gt;</description>
                    <author>Ather Fawaz</author>
                    <pubDate>Tue, 10 Nov 2020 05:00:01 +0000</pubDate>
                    <guid>https://www.neowin.net/news/mipsology-partners-with-oki-ids-to-bring-fpga-accelerated-ml-applications-to-japan/</guid>
                    <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2020/11/1604981411_cert-bae_story.jpg"
                                     width="760"
                                     height="428" />
                    <!-- Site-specific extension elements from the neowin namespace. -->
                    <neowin:tags>#Mipsology #OKIIDS #FPGA</neowin:tags>
                    <neowin:twitter>@AtherFawaz</neowin:twitter>
                </item>
        	</channel>
</rss>
