diff --git a/buzz/transcriber/local_whisper_cpp_server_transcriber.py b/buzz/transcriber/local_whisper_cpp_server_transcriber.py index 3b2d76dd..31dcdb92 100644 --- a/buzz/transcriber/local_whisper_cpp_server_transcriber.py +++ b/buzz/transcriber/local_whisper_cpp_server_transcriber.py @@ -25,7 +25,8 @@ class LocalWhisperCppServerTranscriber(OpenAIWhisperAPIFileTranscriber): "--port", "3000", "--inference-path", "/audio/transcriptions", "--threads", str(os.getenv("BUZZ_WHISPERCPP_N_THREADS", (os.cpu_count() or 8) // 2)), - "--model", task.model_path + "--model", task.model_path, + "--suppress-nst" ] if task.transcription_options.language is not None: diff --git a/buzz/transcriber/whisper_cpp.py b/buzz/transcriber/whisper_cpp.py index d43ea38b..b523fb73 100644 --- a/buzz/transcriber/whisper_cpp.py +++ b/buzz/transcriber/whisper_cpp.py @@ -166,6 +166,7 @@ class WhisperCpp: params.max_len = 1 if transcription_options.word_level_timings else 0 params.token_timestamps = transcription_options.word_level_timings params.initial_prompt = self.instance.get_string(transcription_options.initial_prompt) + params.suppress_nst = True # To prevent errors in transcripts with music return params def __del__(self): diff --git a/docs/docs/index.md b/docs/docs/index.md index 48395eec..a03d4efe 100644 --- a/docs/docs/index.md +++ b/docs/docs/index.md @@ -31,7 +31,7 @@ OpenAI's [Whisper](https://github.com/openai/whisper). - [Command-Line Interface](#command-line-interface) - Available on Mac, Windows, and Linux -## Transcription Viewer Interface +## Transcription Viewer Buzz features a powerful transcription viewer that makes it easy to work with your transcriptions: @@ -41,4 +41,4 @@ Buzz features a powerful transcription viewer that makes it easy to work with yo - **🎨 Clean Interface**: Conditional visibility keeps the interface uncluttered - **💾 State Persistence**: Remembers your preferences between sessions -[Learn more about the Transcription Viewer Interface →](https://chidiwilliams.github.io/buzz/docs/usage/transcription_viewer) +[Learn more about the Transcription Viewer →](https://chidiwilliams.github.io/buzz/docs/usage/transcription_viewer) diff --git a/docs/docs/usage/5_transcription_viewer.md b/docs/docs/usage/5_transcription_viewer.md index 598088f5..a4c9c9e2 100644 --- a/docs/docs/usage/5_transcription_viewer.md +++ b/docs/docs/usage/5_transcription_viewer.md @@ -1,4 +1,4 @@ -# Transcription Viewer Interface +# Transcription Viewer The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer. @@ -105,6 +105,7 @@ The search bar appears below the toolbar when activated and provides: - **Button Sizing**: Speed control buttons match the size of search navigation buttons for visual consistency ## Keyboard Shortcuts +(since version 1.3.0) ### Audio Playback - **`Ctrl+P` / `Cmd+P`**: Play/Pause audio