Skip to content
Snippets Groups Projects
Commit 653b7ca5 authored by Andres Marafioti
Browse files

Assigning min new tokens to a compiled whisper graph on a thread breaks it

parent fc9f9602
No related branches found
No related tags found
No related merge requests found
...@@ -67,7 +67,7 @@ class WhisperSTTHandler(BaseHandler): ...@@ -67,7 +67,7 @@ class WhisperSTTHandler(BaseHandler):
# generating more tokens than previously will trigger CUDA graphs capture # generating more tokens than previously will trigger CUDA graphs capture
# one should warmup with a number of generated tokens above max tokens targeted for subsequent generation # one should warmup with a number of generated tokens above max tokens targeted for subsequent generation
warmup_gen_kwargs = { warmup_gen_kwargs = {
"min_new_tokens": self.gen_kwargs["min_new_tokens"], "min_new_tokens": self.gen_kwargs["max_new_tokens"], # Yes, assign max_new_tokens to min_new_tokens
"max_new_tokens": self.gen_kwargs["max_new_tokens"], "max_new_tokens": self.gen_kwargs["max_new_tokens"],
**self.gen_kwargs, **self.gen_kwargs,
} }
......
...@@ -33,12 +33,6 @@ class WhisperSTTHandlerArguments: ...@@ -33,12 +33,6 @@ class WhisperSTTHandlerArguments:
"help": "The maximum number of new tokens to generate. Default is 128." "help": "The maximum number of new tokens to generate. Default is 128."
}, },
) )
stt_gen_min_new_tokens: int = field(
default=0,
metadata={
"help": "The minimum number of new tokens to generate. Default is 0."
},
)
stt_gen_num_beams: int = field( stt_gen_num_beams: int = field(
default=1, default=1,
metadata={ metadata={
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment