From e35a6592f53ee34b1ec2fc3f1e009dd1ebc79e65 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Piotr=20=C5=BBelasko?= <petezor@gmail.com>
Date: Wed, 25 Sep 2024 16:02:46 -0400
Subject: [PATCH] Add inference optimization blog post announcement to README
 (#10623)
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Signed-off-by: Piotr Żelasko <petezor@gmail.com>
---
 README.md | 10 ++++++++++
 1 file changed, 10 insertions(+)
diff --git a/README.md b/README.md
index 9b019d3ac175..f229cfb637ea 100644
--- a/README.md
+++ b/README.md
@@ -78,6 +78,16 @@
 
 <details open>
   <summary><b>Speech Recognition</b></summary>
+    <details>
+      <summary>
+        <a href="https://developer.nvidia.com/blog/accelerating-leaderboard-topping-asr-models-10x-with-nvidia-nemo/">
+          Accelerating Leaderboard-Topping ASR Models 10x with NVIDIA NeMo
+        </a> (2024/09/24)
+      </summary>
+      The NVIDIA NeMo team released a number of inference optimizations for CTC, RNN-T, and TDT models that resulted in up to 10x inference speed-up.
+      These models now exceed an inverse real-time factor (RTFx) of 2,000, with some even reaching an RTFx of 6,000.
+      <br><br>
+    </details>
     <details>
       <summary>
         <a href="https://developer.nvidia.com/blog/new-standard-for-speech-recognition-and-translation-from-the-nvidia-nemo-canary-model/">