diff --git a/Whisper_Transcription_+_NeMo_Diarization.ipynb b/Whisper_Transcription_+_NeMo_Diarization.ipynb index d5bc226..c148146 100644 --- a/Whisper_Transcription_+_NeMo_Diarization.ipynb +++ b/Whisper_Transcription_+_NeMo_Diarization.ipynb @@ -29,7 +29,7 @@ }, "outputs": [], "source": [ - "!pip install git+https://github.com/SYSTRAN/faster-whisper.git ctranslate2==4.4.0\n", + "!pip install \"faster-whisper>=1.1.0\" ctranslate2==4.4.0\n", "!pip install \"nemo-toolkit[asr]>=2.dev\"\n", "!pip install git+https://github.com/MahmoudAshraf97/demucs.git\n", "!pip install git+https://github.com/oliverguhr/deepmultilingualpunctuation.git\n", diff --git a/diarize.py b/diarize.py index 905c72e..d75243a 100644 --- a/diarize.py +++ b/diarize.py @@ -135,14 +135,12 @@ language, suppress_tokens=suppress_tokens, batch_size=args.batch_size, - without_timestamps=True, ) else: transcript_segments, info = whisper_model.transcribe( audio_waveform, language, suppress_tokens=suppress_tokens, - without_timestamps=True, vad_filter=True, ) diff --git a/diarize_parallel.py b/diarize_parallel.py index a071bd9..a4e45d5 100644 --- a/diarize_parallel.py +++ b/diarize_parallel.py @@ -137,14 +137,12 @@ language, suppress_tokens=suppress_tokens, batch_size=args.batch_size, - without_timestamps=True, ) else: transcript_segments, info = whisper_model.transcribe( audio_waveform, language, suppress_tokens=suppress_tokens, - without_timestamps=True, vad_filter=True, ) diff --git a/requirements.txt b/requirements.txt index a93fa06..928fcb4 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,7 +1,7 @@ wget nemo_toolkit[asr]==2.0.0rc0 nltk -git+https://github.com/SYSTRAN/faster-whisper.git +faster-whisper>=1.1.0 git+https://github.com/MahmoudAshraf97/demucs.git git+https://github.com/oliverguhr/deepmultilingualpunctuation.git git+https://github.com/MahmoudAshraf97/ctc-forced-aligner.git