From f0ff12965af9c7a026e1d9c1884629adf9b8e9ab Mon Sep 17 00:00:00 2001
From: Guillaume Klein <guillaumekln@users.noreply.github.com>
Date: Fri, 1 Sep 2023 17:31:30 +0200
Subject: [PATCH] Expose generation parameter no_repeat_ngram_size (#449)

---
 faster_whisper/transcribe.py | 5 +++++
 1 file changed, 5 insertions(+)

diff --git a/faster_whisper/transcribe.py b/faster_whisper/transcribe.py
index 7ff27d2..326eecb 100644
--- a/faster_whisper/transcribe.py
+++ b/faster_whisper/transcribe.py
@@ -48,6 +48,7 @@ class TranscriptionOptions(NamedTuple):
     patience: float
     length_penalty: float
     repetition_penalty: float
+    no_repeat_ngram_size: int
     log_prob_threshold: Optional[float]
     no_speech_threshold: Optional[float]
     compression_ratio_threshold: Optional[float]
@@ -163,6 +164,7 @@ class WhisperModel:
         patience: float = 1,
         length_penalty: float = 1,
         repetition_penalty: float = 1,
+        no_repeat_ngram_size: int = 0,
         temperature: Union[float, List[float], Tuple[float, ...]] = [
             0.0,
             0.2,
@@ -202,6 +204,7 @@ class WhisperModel:
           length_penalty: Exponential length penalty constant.
           repetition_penalty: Penalty applied to the score of previously generated tokens
             (set > 1 to penalize).
+          no_repeat_ngram_size: Prevent repetitions of ngrams with this size (set 0 to disable).
           temperature: Temperature for sampling. It can be a tuple of temperatures,
             which will be successively used upon failures according to either
             `compression_ratio_threshold` or `log_prob_threshold`.
@@ -327,6 +330,7 @@ class WhisperModel:
             patience=patience,
             length_penalty=length_penalty,
             repetition_penalty=repetition_penalty,
+            no_repeat_ngram_size=no_repeat_ngram_size,
             log_prob_threshold=log_prob_threshold,
             no_speech_threshold=no_speech_threshold,
             compression_ratio_threshold=compression_ratio_threshold,
@@ -630,6 +634,7 @@ class WhisperModel:
                 [prompt],
                 length_penalty=options.length_penalty,
                 repetition_penalty=options.repetition_penalty,
+                no_repeat_ngram_size=options.no_repeat_ngram_size,
                 max_length=self.max_length,
                 return_scores=True,
                 return_no_speech_prob=True,