From 3b685e2629c5763352100c11c80e03fec7ebae47 Mon Sep 17 00:00:00 2001
From: Andres Marafioti <andimarafioti@gmail.com>
Date: Wed, 28 Aug 2024 12:02:47 +0200
Subject: [PATCH] add comment to clarify more

---
 STT/whisper_stt_handler.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/STT/whisper_stt_handler.py b/STT/whisper_stt_handler.py
index b1596a9..1470bfb 100644
--- a/STT/whisper_stt_handler.py
+++ b/STT/whisper_stt_handler.py
@@ -66,6 +66,7 @@ class WhisperSTTHandler(BaseHandler):
         if self.compile_mode not in (None, "default"):
             # generating more tokens than previously will trigger CUDA graphs capture
             # one should warmup with a number of generated tokens above max tokens targeted for subsequent generation
+            # hence, warming up with min_new_tokens < max_new_tokens doesn't make sense: force generation of the full max_new_tokens
             warmup_gen_kwargs = {
                 "min_new_tokens": self.gen_kwargs["max_new_tokens"],  # Yes, assign max_new_tokens to min_new_tokens
                 "max_new_tokens": self.gen_kwargs["max_new_tokens"],
-- 
GitLab