diff --git a/pyproject.toml b/pyproject.toml index 7ad075c4a..bd22bfdad 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -2,7 +2,7 @@ urls = { repository = "https://github.com/m-bain/whisperx" } authors = [{ name = "Max Bain" }] name = "whisperx" -version = "3.4.0" +version = "3.4.1" description = "Time-Accurate Automatic Speech Recognition using Whisper." readme = "README.md" requires-python = ">=3.9, <3.13" diff --git a/uv.lock b/uv.lock index b7ce4d8ba..e24a7a4e8 100644 --- a/uv.lock +++ b/uv.lock @@ -2788,7 +2788,7 @@ wheels = [ [[package]] name = "whisperx" -version = "3.4.0" +version = "3.4.1" source = { editable = "." } dependencies = [ { name = "ctranslate2" }, diff --git a/whisperx/transcribe.py b/whisperx/transcribe.py index c1b599a48..46a774688 100644 --- a/whisperx/transcribe.py +++ b/whisperx/transcribe.py @@ -213,12 +213,19 @@ def transcribe_task(args: dict, parser: argparse.ArgumentParser): results = [] diarize_model = DiarizationPipeline(model_name=diarize_model_name, use_auth_token=hf_token, device=device) for result, input_audio_path in tmp_results: - diarize_segments, speaker_embeddings = diarize_model( + diarize_result = diarize_model( input_audio_path, min_speakers=min_speakers, max_speakers=max_speakers, return_embeddings=return_speaker_embeddings ) + + if return_speaker_embeddings: + diarize_segments, speaker_embeddings = diarize_result + else: + diarize_segments = diarize_result + speaker_embeddings = None + result = assign_word_speakers(diarize_segments, result, speaker_embeddings) results.append((result, input_audio_path)) # >> Write