<?xml version="1.0" encoding="UTF-8"?>
<!--
    RSS 2.0 feed of Neowin news items tagged "tensorrt".
    Each <item> carries the standard RSS fields plus a media:thumbnail
    and the neowin:tags / neowin:twitter extension elements.
    <description> holds escaped HTML; do not pretty-print its content.
    NOTE(review): RSS 2.0 defines <author> as an e-mail address, but the
    items below carry display names. Confirm consumers tolerate this.
-->
<rss version="2.0" xmlns:media="http://search.yahoo.com/mrss/" xmlns:atom="http://www.w3.org/2005/Atom" xmlns:neowin="https://www.neowin.net/">
    <channel>
        <title>Neowin News Feed for: Tensorrt</title>
        <link>https://www.neowin.net/news/tag/tensorrt/</link>
        <atom:link href="https://www.neowin.net/news/rss/tensorrt/" rel="self" type="application/rss+xml" />
        <description>Neowin News Feed for: Tensorrt</description>
        <language>en-us</language>
        <generator>Neowin Ignition News</generator>
        <managingEditor>editor@neowin.net (Managing Editor)</managingEditor>
        <webMaster>developers@neowin.net (Neowin Developers)</webMaster>
        <ttl>5</ttl>
        <image>
            <title>Neowin.net</title>
            <url>https://www.neowin.net/images/pegasus/icon.png</url>
            <link>https://www.neowin.net</link>
        </image>
        <item>
            <title>NVIDIA announces TensorRT-LLM for Windows that boosts LLMs by up to 4 times with RTX GPUs</title>
            <link>https://www.neowin.net/news/nvidia-announces-tensorrt-llm-for-windows-that-boosts-llms-by-up-to-4-times-with-rtx-gpus/</link>
            <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2020/02/1581165737_nvidia-logo-1280x637_medium.jpg" alt="" /&gt;&lt;/div&gt;NVIDIA has announced TensorRT-LLM for Windows. This open-source library will allow PC developers with NVIDIA GeForce RTX graphics cards to boost the performance of LLMs by up to four times. &lt;a href="https://www.neowin.net/news/nvidia-announces-tensorrt-llm-for-windows-that-boosts-llms-by-up-to-4-times-with-rtx-gpus/"&gt;Read more...&lt;/a&gt;</description>
            <author>John Callaham</author>
            <pubDate>Tue, 17 Oct 2023 20:50:01 +0000</pubDate>
            <guid>https://www.neowin.net/news/nvidia-announces-tensorrt-llm-for-windows-that-boosts-llms-by-up-to-4-times-with-rtx-gpus/</guid>
            <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2020/02/1581165737_nvidia-logo-1280x637_story.jpg" width="760" height="428" />
            <neowin:tags>#NVIDIA #TensorRT-LLM</neowin:tags>
            <neowin:twitter>@JCalNEO</neowin:twitter>
        </item>
        <item>
            <title>Nvidia announces TensorRT 8, slashes BERT inference times down to a millisecond</title>
            <link>https://www.neowin.net/news/nvidia-announces-tensorrt-8-slashes-bert-inference-times-down-to-a-millisecond/</link>
            <description>&lt;div style="float:left;margin-right:10px;"&gt;&lt;img src="https://cdn.neowin.com/news/images/uploaded/2021/07/1626779149_nvidia_header_medium.jpg" alt="" /&gt;&lt;/div&gt;Providing over twice the precision and inference speed compared to the last generation, Nvidia&amp;#039;s new TensorRT 8 deep learning SDK clocked in a time of 1.2 ms in BERT-Large&amp;#039;s inference. &lt;a href="https://www.neowin.net/news/nvidia-announces-tensorrt-8-slashes-bert-inference-times-down-to-a-millisecond/"&gt;Read more...&lt;/a&gt;</description>
            <author>Ather Fawaz</author>
            <pubDate>Tue, 20 Jul 2021 13:00:01 +0000</pubDate>
            <guid>https://www.neowin.net/news/nvidia-announces-tensorrt-8-slashes-bert-inference-times-down-to-a-millisecond/</guid>
            <media:thumbnail url="https://cdn.neowin.com/news/images/uploaded/2021/07/1626779149_nvidia_header_story.jpg" width="760" height="428" />
            <neowin:tags>#Nvidia #TensorRT8 #AI #ML</neowin:tags>
            <neowin:twitter>@AtherFawaz</neowin:twitter>
        </item>
    </channel>
</rss>
