From ae9898f0d8423bef75cbfde2cc397bd38f78a3b8 Mon Sep 17 00:00:00 2001
From: Guillaume Klein
Date: Wed, 15 Mar 2023 15:30:29 +0100
Subject: [PATCH] Include duration in AudioInfo structure

---
 faster_whisper/transcribe.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/faster_whisper/transcribe.py b/faster_whisper/transcribe.py
index 25ef989..5fa329c 100644
--- a/faster_whisper/transcribe.py
+++ b/faster_whisper/transcribe.py
@@ -31,6 +31,7 @@ class Segment(NamedTuple):
 class AudioInfo(NamedTuple):
     language: str
     language_probability: float
+    duration: float
 
 
 class TranscriptionOptions(NamedTuple):
@@ -193,6 +194,7 @@ class WhisperModel:
                 audio, sampling_rate=self.feature_extractor.sampling_rate
             )
 
+        duration = audio.shape[0] / self.feature_extractor.sampling_rate
         features = self.feature_extractor(audio)
 
         if language is None:
@@ -243,6 +245,7 @@ class WhisperModel:
         audio_info = AudioInfo(
             language=language,
             language_probability=language_probability,
+            duration=duration,
         )
 
         return segments, audio_info