diff --git a/404.html b/404.html index 1e1633d1..1756226b 100644 --- a/404.html +++ b/404.html @@ -4,13 +4,13 @@ Page Not Found | Buzz - +
Skip to main content

Page Not Found

We could not find what you were looking for.

Please contact the owner of the site that linked you to the original URL and let them know their link is broken.

- + \ No newline at end of file diff --git a/assets/js/2c266bbb.2d6b08c4.js b/assets/js/2c266bbb.2d6b08c4.js deleted file mode 100644 index eeb10ef6..00000000 --- a/assets/js/2c266bbb.2d6b08c4.js +++ /dev/null @@ -1 +0,0 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[799],{3905:(e,t,n)=>{n.d(t,{Zo:()=>s,kt:()=>g});var a=n(7294);function r(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function o(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function i(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var o=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var p=a.createContext({}),u=function(e){var t=a.useContext(p),n=t;return e&&(n="function"==typeof e?e(t):i(i({},t),e)),n},s=function(e){var t=u(e.components);return a.createElement(p.Provider,{value:t},e.children)},c="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return a.createElement(a.Fragment,{},t)}},m=a.forwardRef((function(e,t){var n=e.components,r=e.mdxType,o=e.originalType,p=e.parentName,s=l(e,["components","mdxType","originalType","parentName"]),c=u(n),m=r,g=c["".concat(p,".").concat(m)]||c[m]||d[m]||o;return n?a.createElement(g,i(i({ref:t},s),{},{components:n})):a.createElement(g,i({ref:t},s))}));function g(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var o=n.length,i=new Array(o);i[0]=m;var l={};for(var p in t)hasOwnProperty.call(t,p)&&(l[p]=t[p]);l.originalType=e,l[c]="string"==typeof e?e:r,i[1]=l;for(var u=2;u{n.r(t),n.d(t,{assets:()=>p,contentTitle:()=>i,default:()=>d,frontMatter:()=>o,metadata:()=>l,toc:()=>u});var a=n(7462),r=(n(7294),n(3905));const o={title:"Live Recording"},i=void 
0,l={unversionedId:"usage/live_recording",id:"usage/live_recording",title:"Live Recording",description:"To start a live recording:",source:"@site/docs/usage/2_live_recording.md",sourceDirName:"usage",slug:"/usage/live_recording",permalink:"/buzz/docs/usage/live_recording",draft:!1,tags:[],version:"current",sidebarPosition:2,frontMatter:{title:"Live Recording"},sidebar:"tutorialSidebar",previous:{title:"File Import",permalink:"/buzz/docs/usage/file_import"},next:{title:"Translations",permalink:"/buzz/docs/usage/translations"}},p={},u=[{value:"Advanced preferences",id:"advanced-preferences",level:4},{value:"Presentation Window",id:"presentation-window",level:4},{value:"Record audio playing from computer (macOS)",id:"record-audio-playing-from-computer-macos",level:3},{value:"Record audio playing from computer (Windows)",id:"record-audio-playing-from-computer-windows",level:3},{value:"Record audio playing from computer (Linux)",id:"record-audio-playing-from-computer-linux",level:3}],s={toc:u},c="wrapper";function d(e){let{components:t,...n}=e;return(0,r.kt)(c,(0,a.Z)({},s,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("p",null,"To start a live recording:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},"Select a recording task, language, quality, and microphone."),(0,r.kt)("li",{parentName:"ul"},"Click Record.")),(0,r.kt)("blockquote",null,(0,r.kt)("p",{parentName:"blockquote"},(0,r.kt)("strong",{parentName:"p"},"Note:")," Transcribing audio using the default Whisper model is resource-intensive. Consider using the Whisper.cpp.\nIt supports GPU acceleration, if the model fits in GPU memory. 
Use smaller models for real-time performance.")),(0,r.kt)("table",null,(0,r.kt)("thead",{parentName:"table"},(0,r.kt)("tr",{parentName:"thead"},(0,r.kt)("th",{parentName:"tr",align:null},"Field"),(0,r.kt)("th",{parentName:"tr",align:null},"Options"),(0,r.kt)("th",{parentName:"tr",align:null},"Default"),(0,r.kt)("th",{parentName:"tr",align:null},"Description"))),(0,r.kt)("tbody",{parentName:"table"},(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Task"),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe", "Translate to English"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe" converts the input audio into text in the selected language, while "Translate to English" converts it into text in English.')),(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Language"),(0,r.kt)("td",{parentName:"tr",align:null},"See ",(0,r.kt)("a",{parentName:"td",href:"https://github.com/openai/whisper#available-models-and-languages"},"Whisper's documentation")," for the full list of supported languages"),(0,r.kt)("td",{parentName:"tr",align:null},'"Detect Language"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Detect Language" will try to detect the spoken language in the audio based on the first few seconds. 
However, selecting a language is recommended (if known) as it will improve transcription quality in many cases.')),(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Microphone"),(0,r.kt)("td",{parentName:"tr",align:null},"[Available system microphones]"),(0,r.kt)("td",{parentName:"tr",align:null},"[Default system microphone]"),(0,r.kt)("td",{parentName:"tr",align:null},"Microphone for recording input audio.")))),(0,r.kt)("p",null,(0,r.kt)("a",{parentName:"p",href:"https://www.loom.com/share/564b753eb4d44b55b985b8abd26b55f7",title:"Live Recording on Buzz"},(0,r.kt)("img",{parentName:"a",src:"https://cdn.loom.com/sessions/thumbnails/564b753eb4d44b55b985b8abd26b55f7-with-play.gif",alt:"Live Recording on Buzz"}))),(0,r.kt)("h4",{id:"advanced-preferences"},"Advanced preferences"),(0,r.kt)("p",null,(0,r.kt)("strong",{parentName:"p"},"Silence threshold")," Set threshold to for transcriptions to be processed. If average volume level is under this setting the sentence will not be transcribed. Available since 1.4.4.\n",(0,r.kt)("strong",{parentName:"p"},"Line separator")," Marking to add to the transcription and translation lines. Default value is two new lines (",(0,r.kt)("inlineCode",{parentName:"p"},"\\n\\n"),") that result in an empty space between translation or transcription lines. To have no empty line use ",(0,r.kt)("inlineCode",{parentName:"p"},"\\n"),". Available since 1.4.4."),(0,r.kt)("h4",{id:"presentation-window"},"Presentation Window"),(0,r.kt)("p",null,"Since 1.4.2 Buzz has an easy to use presentation window you can use to show live transcriptions during events and presentations. 
To open it start the recording and new options for the ",(0,r.kt)("inlineCode",{parentName:"p"},"Presentation window")," will appear."),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-macos"},"Record audio playing from computer (macOS)"),(0,r.kt)("p",null,"To record audio playing from an application on your computer, you may install an audio loopback driver (a program that\nlets you create virtual audio devices). The rest of this guide will\nuse ",(0,r.kt)("a",{parentName:"p",href:"https://github.com/ExistentialAudio/BlackHole"},"BlackHole")," on Mac, but you can use other alternatives for your\noperating system (\nsee ",(0,r.kt)("a",{parentName:"p",href:"https://nerds.de/en/loopbeaudio.html"},"LoopBeAudio"),", ",(0,r.kt)("a",{parentName:"p",href:"https://rogueamoeba.com/loopback/"},"LoopBack"),",\nand ",(0,r.kt)("a",{parentName:"p",href:"https://vac.muzychenko.net/en/"},"Virtual Audio Cable"),")."),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Install ",(0,r.kt)("a",{parentName:"p",href:"https://github.com/ExistentialAudio/BlackHole#option-2-install-via-homebrew"},"BlackHole via Homebrew")),(0,r.kt)("pre",{parentName:"li"},(0,r.kt)("code",{parentName:"pre",className:"language-shell"},"brew install blackhole-2ch\n"))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Open Audio MIDI Setup from Spotlight or from ",(0,r.kt)("inlineCode",{parentName:"p"},"/Applications/Utilities/Audio Midi Setup.app"),"."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/spotlight.png",alt:"Open Audio MIDI Setup from Spotlight"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Click the '+' icon at the lower left corner and select 'Create Multi-Output Device'."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/createmulti-output.png",alt:"Create multi-output 
device"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Add your default speaker and BlackHole to the multi-output device."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/multi-output.png",alt:"Screenshot of multi-output device"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Select this multi-output device as your speaker (application or system-wide) to play audio into BlackHole.")),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Open Buzz, select BlackHole as your microphone, and record as before to see transcriptions from the audio playing\nthrough BlackHole."))),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-windows"},"Record audio playing from computer (Windows)"),(0,r.kt)("p",null,"To transcribe system audio you need to configure virtual audio device and connect output from the applications you whant to transcribe to this virtual speaker. After that you can select it as source in the Buzz."),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Install ",(0,r.kt)("a",{parentName:"p",href:"https://vb-audio.com/Cable/"},"VB CABLE")," as virtual audio device. ")),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},'Configure using Windows Sound settings. Right-click on the speaker icon in the system tray and select "Open Sound settings". In the "Choose your output device" dropdown select "CABLE Input" to send all system sound to the virtual device or use "Advanced sound options" to select application that will output their sound to this device.'))),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-linux"},"Record audio playing from computer (Linux)"),(0,r.kt)("p",null,"As described on ",(0,r.kt)("a",{parentName:"p",href:"https://wiki.ubuntu.com/record_system_sound"},"Ubuntu Wiki")," on any Linux with pulse audio you can redirect application audio to a virtual speaker. 
After that you can select it as source in Buzz."),(0,r.kt)("p",null,"Overall steps:"),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},"Launch application that will produce the sound you want to transcribe and start the playback. For example start a video in a media player. "),(0,r.kt)("li",{parentName:"ol"},"Launch Buzz and open Live recording screen, so you see the settings."),(0,r.kt)("li",{parentName:"ol"},"Configure sound routing from the application you want to transcribe sound from to Buzz in ",(0,r.kt)("inlineCode",{parentName:"li"},"Recording tab")," of the PulseAudio Volume Control (",(0,r.kt)("inlineCode",{parentName:"li"},"pavucontrol"),").")))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/2c266bbb.7fe1d26b.js b/assets/js/2c266bbb.7fe1d26b.js new file mode 100644 index 00000000..805b2aeb --- /dev/null +++ b/assets/js/2c266bbb.7fe1d26b.js @@ -0,0 +1 @@ +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[799],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>g});var a=n(7294);function r(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function o(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function i(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var o=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var p=a.createContext({}),s=function(e){var t=a.useContext(p),n=t;return e&&(n="function"==typeof e?e(t):i(i({},t),e)),n},u=function(e){var t=s(e.components);return a.createElement(p.Provider,{value:t},e.children)},c="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return a.createElement(a.Fragment,{},t)}},m=a.forwardRef((function(e,t){var 
n=e.components,r=e.mdxType,o=e.originalType,p=e.parentName,u=l(e,["components","mdxType","originalType","parentName"]),c=s(n),m=r,g=c["".concat(p,".").concat(m)]||c[m]||d[m]||o;return n?a.createElement(g,i(i({ref:t},u),{},{components:n})):a.createElement(g,i({ref:t},u))}));function g(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var o=n.length,i=new Array(o);i[0]=m;var l={};for(var p in t)hasOwnProperty.call(t,p)&&(l[p]=t[p]);l.originalType=e,l[c]="string"==typeof e?e:r,i[1]=l;for(var s=2;s{n.r(t),n.d(t,{assets:()=>p,contentTitle:()=>i,default:()=>d,frontMatter:()=>o,metadata:()=>l,toc:()=>s});var a=n(7462),r=(n(7294),n(3905));const o={title:"Live Recording"},i=void 0,l={unversionedId:"usage/live_recording",id:"usage/live_recording",title:"Live Recording",description:"To start a live recording:",source:"@site/docs/usage/2_live_recording.md",sourceDirName:"usage",slug:"/usage/live_recording",permalink:"/buzz/docs/usage/live_recording",draft:!1,tags:[],version:"current",sidebarPosition:2,frontMatter:{title:"Live Recording"},sidebar:"tutorialSidebar",previous:{title:"File Import",permalink:"/buzz/docs/usage/file_import"},next:{title:"Translations",permalink:"/buzz/docs/usage/translations"}},p={},s=[{value:"Advanced preferences",id:"advanced-preferences",level:4},{value:"Presentation Window",id:"presentation-window",level:4},{value:"Record audio playing from computer (macOS)",id:"record-audio-playing-from-computer-macos",level:3},{value:"Record audio playing from computer (Windows)",id:"record-audio-playing-from-computer-windows",level:3},{value:"Record audio playing from computer (Linux)",id:"record-audio-playing-from-computer-linux",level:3}],u={toc:s},c="wrapper";function d(e){let{components:t,...n}=e;return(0,r.kt)(c,(0,a.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("p",null,"To start a live recording:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},"Select a recording task, language, quality, and 
microphone."),(0,r.kt)("li",{parentName:"ul"},"Click Record.")),(0,r.kt)("blockquote",null,(0,r.kt)("p",{parentName:"blockquote"},(0,r.kt)("strong",{parentName:"p"},"Note:")," Transcribing audio using the default Whisper model is resource-intensive. Consider using the Whisper.cpp.\nIt supports GPU acceleration, if the model fits in GPU memory. Use smaller models for real-time performance.")),(0,r.kt)("table",null,(0,r.kt)("thead",{parentName:"table"},(0,r.kt)("tr",{parentName:"thead"},(0,r.kt)("th",{parentName:"tr",align:null},"Field"),(0,r.kt)("th",{parentName:"tr",align:null},"Options"),(0,r.kt)("th",{parentName:"tr",align:null},"Default"),(0,r.kt)("th",{parentName:"tr",align:null},"Description"))),(0,r.kt)("tbody",{parentName:"table"},(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Task"),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe", "Translate to English"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Transcribe" converts the input audio into text in the selected language, while "Translate to English" converts it into text in English.')),(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Language"),(0,r.kt)("td",{parentName:"tr",align:null},"See ",(0,r.kt)("a",{parentName:"td",href:"https://github.com/openai/whisper#available-models-and-languages"},"Whisper's documentation")," for the full list of supported languages"),(0,r.kt)("td",{parentName:"tr",align:null},'"Detect Language"'),(0,r.kt)("td",{parentName:"tr",align:null},'"Detect Language" will try to detect the spoken language in the audio based on the first few seconds. 
However, selecting a language is recommended (if known) as it will improve transcription quality in many cases.')),(0,r.kt)("tr",{parentName:"tbody"},(0,r.kt)("td",{parentName:"tr",align:null},"Microphone"),(0,r.kt)("td",{parentName:"tr",align:null},"[Available system microphones]"),(0,r.kt)("td",{parentName:"tr",align:null},"[Default system microphone]"),(0,r.kt)("td",{parentName:"tr",align:null},"Microphone for recording input audio.")))),(0,r.kt)("p",null,(0,r.kt)("a",{parentName:"p",href:"https://www.loom.com/share/564b753eb4d44b55b985b8abd26b55f7",title:"Live Recording on Buzz"},(0,r.kt)("img",{parentName:"a",src:"https://cdn.loom.com/sessions/thumbnails/564b753eb4d44b55b985b8abd26b55f7-with-play.gif",alt:"Live Recording on Buzz"}))),(0,r.kt)("h4",{id:"advanced-preferences"},"Advanced preferences"),(0,r.kt)("p",null,(0,r.kt)("strong",{parentName:"p"},"Silence threshold")," Set threshold to for transcriptions to be processed. If average volume level is under this setting the sentence will not be transcribed. Available since 1.4.4."),(0,r.kt)("p",null,(0,r.kt)("strong",{parentName:"p"},"Line separator")," Marking to add to the transcription and translation lines. Default value is two new lines (",(0,r.kt)("inlineCode",{parentName:"p"},"\\n\\n"),") that result in an empty space between translation or transcription lines. To have no empty line use ",(0,r.kt)("inlineCode",{parentName:"p"},"\\n"),". Available since 1.4.4."),(0,r.kt)("p",null,(0,r.kt)("strong",{parentName:"p"},"Transcription step")," If live recording mode is set to ",(0,r.kt)("inlineCode",{parentName:"p"},"Append and correct"),", you can also set a transcription step. Shorter steps will reduce latency but cause larger load on the system. Monitor the ",(0,r.kt)("inlineCode",{parentName:"p"},"Queue")," while transcribing in this mode, if it grows too much, increase the transcription step, to reduce load. 
Available since 1.4.4."),(0,r.kt)("p",null,(0,r.kt)("strong",{parentName:"p"},"Hide unconfirmed")," If live recording mode is set to ",(0,r.kt)("inlineCode",{parentName:"p"},"Append and correct"),", you can also hide the unconfirmed part of the last transcript. This part may be incorrect as the Buzz has seen it only in one overlapping transcription segment. Hiding it will increase latency, but result will show only the correct transcripts. Available since 1.4.4."),(0,r.kt)("h4",{id:"presentation-window"},"Presentation Window"),(0,r.kt)("p",null,"Buzz has an easy to use presentation window you can use to show live transcriptions during events and presentations. To open it start the recording and new options for the ",(0,r.kt)("inlineCode",{parentName:"p"},"Presentation window")," will appear."),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-macos"},"Record audio playing from computer (macOS)"),(0,r.kt)("p",null,"To record audio playing from an application on your computer, you may install an audio loopback driver (a program that\nlets you create virtual audio devices). 
The rest of this guide will\nuse ",(0,r.kt)("a",{parentName:"p",href:"https://github.com/ExistentialAudio/BlackHole"},"BlackHole")," on Mac, but you can use other alternatives for your\noperating system (\nsee ",(0,r.kt)("a",{parentName:"p",href:"https://nerds.de/en/loopbeaudio.html"},"LoopBeAudio"),", ",(0,r.kt)("a",{parentName:"p",href:"https://rogueamoeba.com/loopback/"},"LoopBack"),",\nand ",(0,r.kt)("a",{parentName:"p",href:"https://vac.muzychenko.net/en/"},"Virtual Audio Cable"),")."),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Install ",(0,r.kt)("a",{parentName:"p",href:"https://github.com/ExistentialAudio/BlackHole#option-2-install-via-homebrew"},"BlackHole via Homebrew")),(0,r.kt)("pre",{parentName:"li"},(0,r.kt)("code",{parentName:"pre",className:"language-shell"},"brew install blackhole-2ch\n"))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Open Audio MIDI Setup from Spotlight or from ",(0,r.kt)("inlineCode",{parentName:"p"},"/Applications/Utilities/Audio Midi Setup.app"),"."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/spotlight.png",alt:"Open Audio MIDI Setup from Spotlight"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Click the '+' icon at the lower left corner and select 'Create Multi-Output Device'."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/createmulti-output.png",alt:"Create multi-output device"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Add your default speaker and BlackHole to the multi-output device."),(0,r.kt)("p",{parentName:"li"},(0,r.kt)("img",{parentName:"p",src:"https://existential.audio/howto/img/multi-output.png",alt:"Screenshot of multi-output device"}))),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Select this multi-output device as your speaker (application or system-wide) to play audio into 
BlackHole.")),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Open Buzz, select BlackHole as your microphone, and record as before to see transcriptions from the audio playing\nthrough BlackHole."))),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-windows"},"Record audio playing from computer (Windows)"),(0,r.kt)("p",null,"To transcribe system audio you need to configure virtual audio device and connect output from the applications you whant to transcribe to this virtual speaker. After that you can select it as source in the Buzz."),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},"Install ",(0,r.kt)("a",{parentName:"p",href:"https://vb-audio.com/Cable/"},"VB CABLE")," as virtual audio device. ")),(0,r.kt)("li",{parentName:"ol"},(0,r.kt)("p",{parentName:"li"},'Configure using Windows Sound settings. Right-click on the speaker icon in the system tray and select "Open Sound settings". In the "Choose your output device" dropdown select "CABLE Input" to send all system sound to the virtual device or use "Advanced sound options" to select application that will output their sound to this device.'))),(0,r.kt)("h3",{id:"record-audio-playing-from-computer-linux"},"Record audio playing from computer (Linux)"),(0,r.kt)("p",null,"As described on ",(0,r.kt)("a",{parentName:"p",href:"https://wiki.ubuntu.com/record_system_sound"},"Ubuntu Wiki")," on any Linux with pulse audio you can redirect application audio to a virtual speaker. After that you can select it as source in Buzz."),(0,r.kt)("p",null,"Overall steps:"),(0,r.kt)("ol",null,(0,r.kt)("li",{parentName:"ol"},"Launch application that will produce the sound you want to transcribe and start the playback. For example start a video in a media player. 
"),(0,r.kt)("li",{parentName:"ol"},"Launch Buzz and open Live recording screen, so you see the settings."),(0,r.kt)("li",{parentName:"ol"},"Configure sound routing from the application you want to transcribe sound from to Buzz in ",(0,r.kt)("inlineCode",{parentName:"li"},"Recording tab")," of the PulseAudio Volume Control (",(0,r.kt)("inlineCode",{parentName:"li"},"pavucontrol"),").")))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/343de823.33e65bd6.js b/assets/js/343de823.33e65bd6.js new file mode 100644 index 00000000..2665c86c --- /dev/null +++ b/assets/js/343de823.33e65bd6.js @@ -0,0 +1 @@ +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[884],{3905:(t,e,n)=>{n.d(e,{Zo:()=>c,kt:()=>m});var r=n(7294);function o(t,e,n){return e in t?Object.defineProperty(t,e,{value:n,enumerable:!0,configurable:!0,writable:!0}):t[e]=n,t}function a(t,e){var n=Object.keys(t);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(t);e&&(r=r.filter((function(e){return Object.getOwnPropertyDescriptor(t,e).enumerable}))),n.push.apply(n,r)}return n}function i(t){for(var e=1;e=0||(o[n]=t[n]);return o}(t,e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(t);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(t,n)&&(o[n]=t[n])}return o}var l=r.createContext({}),u=function(t){var e=r.useContext(l),n=e;return t&&(n="function"==typeof t?t(e):i(i({},e),t)),n},c=function(t){var e=u(t.components);return r.createElement(l.Provider,{value:e},t.children)},p="mdxType",d={inlineCode:"code",wrapper:function(t){var e=t.children;return r.createElement(r.Fragment,{},e)}},f=r.forwardRef((function(t,e){var n=t.components,o=t.mdxType,a=t.originalType,l=t.parentName,c=s(t,["components","mdxType","originalType","parentName"]),p=u(n),f=o,m=p["".concat(l,".").concat(f)]||p[f]||d[f]||a;return n?r.createElement(m,i(i({ref:e},c),{},{components:n})):r.createElement(m,i({ref:e},c))}));function m(t,e){var 
n=arguments,o=e&&e.mdxType;if("string"==typeof t||o){var a=n.length,i=new Array(a);i[0]=f;var s={};for(var l in e)hasOwnProperty.call(e,l)&&(s[l]=e[l]);s.originalType=t,s[p]="string"==typeof t?t:o,i[1]=s;for(var u=2;u{n.r(e),n.d(e,{assets:()=>l,contentTitle:()=>i,default:()=>d,frontMatter:()=>a,metadata:()=>s,toc:()=>u});var r=n(7462),o=(n(7294),n(3905));const a={title:"Translations"},i=void 0,s={unversionedId:"usage/translations",id:"usage/translations",title:"Translations",description:"Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Buzz supports additional AI translations to any other language.",source:"@site/docs/usage/3_translations.md",sourceDirName:"usage",slug:"/usage/translations",permalink:"/buzz/docs/usage/translations",draft:!1,tags:[],version:"current",sidebarPosition:3,frontMatter:{title:"Translations"},sidebar:"tutorialSidebar",previous:{title:"Live Recording",permalink:"/buzz/docs/usage/live_recording"},next:{title:"Edit and Resize",permalink:"/buzz/docs/usage/edit_and_resize"}},l={},u=[],c={toc:u},p="wrapper";function d(t){let{components:e,...n}=t;return(0,o.kt)(p,(0,r.Z)({},c,n,{components:e,mdxType:"MDXLayout"}),(0,o.kt)("p",null,"Default ",(0,o.kt)("inlineCode",{parentName:"p"},"Translation")," task uses Whisper model ability to translate to English, however ",(0,o.kt)("inlineCode",{parentName:"p"},"Large-V3-Turbo")," is not compatible with this standard. Buzz supports additional AI translations to any other language."),(0,o.kt)("p",null,"To use translation feature you will need to configure OpenAI API key and translation settings. Set OpenAI API ket in Preferences. Buzz also supports custom locally running translation AIs that support OpenAI API. 
For more information on locally running AIs see ",(0,o.kt)("a",{parentName:"p",href:"https://ollama.com/blog/openai-compatibility"},"ollama")," or ",(0,o.kt)("a",{parentName:"p",href:"https://lmstudio.ai/"},"LM Studio"),". For information on available custom APIs see this ",(0,o.kt)("a",{parentName:"p",href:"https://github.com/chidiwilliams/buzz/discussions/827"},"discussion thread"),"."),(0,o.kt)("p",null,"To configure translation for Live recordings enable it in Advances settings dialog of the Live Recording settings. Enter AI model to use and prompt with instructions for the AI on how to translate. Translation option is also available for files that already have speech recognised. Use Translate button on transcription viewer toolbar."),(0,o.kt)("p",null,'For AI to know how to translate enter translation instructions in the "Instructions for AI" section. In your instructions you should describe to what language you want it to translate the text to. Also, you may need to add additional instructions to not add any notes or comments as AIs tend to add them. Example instructions to translate English subtitles to Spanish:'),(0,o.kt)("blockquote",null,(0,o.kt)("p",{parentName:"blockquote"},"You are a professional translator, skilled in translating English to Spanish. You will only translate each sentence sent to you into Spanish and not add any notes or comments.")),(0,o.kt)("p",null,'If you enable "Enable live recording transcription export" in Preferences, Live text transcripts will be exported to a text file as they get generated and translated. 
This file can be used to further integrate Live transcripts with other applications like OBS Studio.'),(0,o.kt)("p",null,"Approximate cost of translation for 1 hour long audio with ChatGPT ",(0,o.kt)("inlineCode",{parentName:"p"},"gpt-4o")," model is around $0.50."))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/343de823.d33c8b39.js b/assets/js/343de823.d33c8b39.js deleted file mode 100644 index 7a98d69a..00000000 --- a/assets/js/343de823.d33c8b39.js +++ /dev/null @@ -1 +0,0 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[884],{3905:(t,e,n)=>{n.d(e,{Zo:()=>c,kt:()=>m});var r=n(7294);function o(t,e,n){return e in t?Object.defineProperty(t,e,{value:n,enumerable:!0,configurable:!0,writable:!0}):t[e]=n,t}function a(t,e){var n=Object.keys(t);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(t);e&&(r=r.filter((function(e){return Object.getOwnPropertyDescriptor(t,e).enumerable}))),n.push.apply(n,r)}return n}function i(t){for(var e=1;e=0||(o[n]=t[n]);return o}(t,e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(t);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(t,n)&&(o[n]=t[n])}return o}var l=r.createContext({}),u=function(t){var e=r.useContext(l),n=e;return t&&(n="function"==typeof t?t(e):i(i({},e),t)),n},c=function(t){var e=u(t.components);return r.createElement(l.Provider,{value:e},t.children)},p="mdxType",d={inlineCode:"code",wrapper:function(t){var e=t.children;return r.createElement(r.Fragment,{},e)}},f=r.forwardRef((function(t,e){var n=t.components,o=t.mdxType,a=t.originalType,l=t.parentName,c=s(t,["components","mdxType","originalType","parentName"]),p=u(n),f=o,m=p["".concat(l,".").concat(f)]||p[f]||d[f]||a;return n?r.createElement(m,i(i({ref:e},c),{},{components:n})):r.createElement(m,i({ref:e},c))}));function m(t,e){var n=arguments,o=e&&e.mdxType;if("string"==typeof t||o){var a=n.length,i=new Array(a);i[0]=f;var s={};for(var l in 
e)hasOwnProperty.call(e,l)&&(s[l]=e[l]);s.originalType=t,s[p]="string"==typeof t?t:o,i[1]=s;for(var u=2;u{n.r(e),n.d(e,{assets:()=>l,contentTitle:()=>i,default:()=>d,frontMatter:()=>a,metadata:()=>s,toc:()=>u});var r=n(7462),o=(n(7294),n(3905));const a={title:"Translations"},i=void 0,s={unversionedId:"usage/translations",id:"usage/translations",title:"Translations",description:"Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Since version 1.0.0 Buzz supports additional AI translations to any other language.",source:"@site/docs/usage/3_translations.md",sourceDirName:"usage",slug:"/usage/translations",permalink:"/buzz/docs/usage/translations",draft:!1,tags:[],version:"current",sidebarPosition:3,frontMatter:{title:"Translations"},sidebar:"tutorialSidebar",previous:{title:"Live Recording",permalink:"/buzz/docs/usage/live_recording"},next:{title:"Edit and Resize",permalink:"/buzz/docs/usage/edit_and_resize"}},l={},u=[],c={toc:u},p="wrapper";function d(t){let{components:e,...n}=t;return(0,o.kt)(p,(0,r.Z)({},c,n,{components:e,mdxType:"MDXLayout"}),(0,o.kt)("p",null,"Default ",(0,o.kt)("inlineCode",{parentName:"p"},"Translation")," task uses Whisper model ability to translate to English, however ",(0,o.kt)("inlineCode",{parentName:"p"},"Large-V3-Turbo")," is not compatible with this standard. Since version ",(0,o.kt)("inlineCode",{parentName:"p"},"1.0.0")," Buzz supports additional AI translations to any other language."),(0,o.kt)("p",null,"To use translation feature you will need to configure OpenAI API key and translation settings. Set OpenAI API ket in Preferences. Buzz also supports custom locally running translation AIs that support OpenAI API. For more information on locally running AIs see ",(0,o.kt)("a",{parentName:"p",href:"https://ollama.com/blog/openai-compatibility"},"ollama")," or ",(0,o.kt)("a",{parentName:"p",href:"https://lmstudio.ai/"},"LM Studio"),". 
For information on available custom APIs see this ",(0,o.kt)("a",{parentName:"p",href:"https://github.com/chidiwilliams/buzz/discussions/827"},"discussion thread"),"."),(0,o.kt)("p",null,"To configure translation for Live recordings enable it in Advances settings dialog of the Live Recording settings. Enter AI model to use and prompt with instructions for the AI on how to translate. Translation option is also available for files that already have speech recognised. Use Translate button on transcription viewer toolbar."),(0,o.kt)("p",null,'For AI to know how to translate enter translation instructions in the "Instructions for AI" section. In your instructions you should describe to what language you want it to translate the text to. Also, you may need to add additional instructions to not add any notes or comments as AIs tend to add them. Example instructions to translate English subtitles to Spanish:'),(0,o.kt)("blockquote",null,(0,o.kt)("p",{parentName:"blockquote"},"You are a professional translator, skilled in translating English to Spanish. You will only translate each sentence sent to you into Spanish and not add any notes or comments.")),(0,o.kt)("p",null,'If you enable "Enable live recording transcription export" in Preferences, Live text transcripts will be exported to a text file as they get generated and translated. 
This file can be used to further integrate Live transcripts with other applications like OBS Studio.'),(0,o.kt)("p",null,"Approximate cost of translation for 1 hour long audio with ChatGPT ",(0,o.kt)("inlineCode",{parentName:"p"},"gpt-4o")," model is around $0.50."))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/36b603e5.6df0f804.js b/assets/js/36b603e5.55d4006f.js similarity index 75% rename from assets/js/36b603e5.6df0f804.js rename to assets/js/36b603e5.55d4006f.js index c445fa72..66f07e82 100644 --- a/assets/js/36b603e5.6df0f804.js +++ b/assets/js/36b603e5.55d4006f.js @@ -1 +1 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[559],{3905:(e,t,n)=>{n.d(t,{Zo:()=>c,kt:()=>f});var r=n(7294);function a(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function l(e){for(var t=1;t=0||(a[n]=e[n]);return a}(e,t);if(Object.getOwnPropertySymbols){var i=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(a[n]=e[n])}return a}var p=r.createContext({}),s=function(e){var t=r.useContext(p),n=t;return e&&(n="function"==typeof e?e(t):l(l({},t),e)),n},c=function(e){var t=s(e.components);return r.createElement(p.Provider,{value:t},e.children)},u="mdxType",m={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},d=r.forwardRef((function(e,t){var n=e.components,a=e.mdxType,i=e.originalType,p=e.parentName,c=o(e,["components","mdxType","originalType","parentName"]),u=s(n),d=a,f=u["".concat(p,".").concat(d)]||u[d]||m[d]||i;return n?r.createElement(f,l(l({ref:t},c),{},{components:n})):r.createElement(f,l({ref:t},c))}));function f(e,t){var 
n=arguments,a=t&&t.mdxType;if("string"==typeof e||a){var i=n.length,l=new Array(i);l[0]=d;var o={};for(var p in t)hasOwnProperty.call(t,p)&&(o[p]=t[p]);o.originalType=e,o[u]="string"==typeof e?e:a,l[1]=o;for(var s=2;s{n.r(t),n.d(t,{assets:()=>p,contentTitle:()=>l,default:()=>m,frontMatter:()=>i,metadata:()=>o,toc:()=>s});var r=n(7462),a=(n(7294),n(3905));const i={title:"File Import"},l=void 0,o={unversionedId:"usage/file_import",id:"usage/file_import",title:"File Import",description:"To import a file:",source:"@site/docs/usage/1_file_import.md",sourceDirName:"usage",slug:"/usage/file_import",permalink:"/buzz/docs/usage/file_import",draft:!1,tags:[],version:"current",sidebarPosition:1,frontMatter:{title:"File Import"},sidebar:"tutorialSidebar",previous:{title:"Installation",permalink:"/buzz/docs/installation"},next:{title:"Live Recording",permalink:"/buzz/docs/usage/live_recording"}},p={},s=[],c={toc:s},u="wrapper";function m(e){let{components:t,...n}=e;return(0,a.kt)(u,(0,r.Z)({},c,n,{components:t,mdxType:"MDXLayout"}),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"To import a file:")),(0,a.kt)("ul",null,(0,a.kt)("li",{parentName:"ul"},"Click Import Media File on the File menu (or the '+' icon on the toolbar, or ",(0,a.kt)("strong",{parentName:"li"},"Command/Ctrl + O"),")."),(0,a.kt)("li",{parentName:"ul"},"Choose an audio or video file."),(0,a.kt)("li",{parentName:"ul"},"Select a task, language, and the model settings."),(0,a.kt)("li",{parentName:"ul"},"Click Run."),(0,a.kt)("li",{parentName:"ul"},"When the transcription status shows 'Completed', double-click on the row (or select the row and click the '\u2922' icon) to\nopen the transcription.")),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"Available options:")),(0,a.kt)("p",null,"To reduce misspellings you can pass some commonly misspelled words in an ",(0,a.kt)("inlineCode",{parentName:"p"},"Initial prompt")," that is available under ",(0,a.kt)("inlineCode",{parentName:"p"},"Advanced...")," 
button. See this ",(0,a.kt)("a",{parentName:"p",href:"https://cookbook.openai.com/examples/whisper_prompting_guide#pass-names-in-the-prompt-to-prevent-misspellings"},"guide on prompting"),". "),(0,a.kt)("table",null,(0,a.kt)("thead",{parentName:"table"},(0,a.kt)("tr",{parentName:"thead"},(0,a.kt)("th",{parentName:"tr",align:null},"Field"),(0,a.kt)("th",{parentName:"tr",align:null},"Options"),(0,a.kt)("th",{parentName:"tr",align:null},"Default"),(0,a.kt)("th",{parentName:"tr",align:null},"Description"))),(0,a.kt)("tbody",{parentName:"table"},(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Export As"),(0,a.kt)("td",{parentName:"tr",align:null},'"TXT", "SRT", "VTT"'),(0,a.kt)("td",{parentName:"tr",align:null},'"TXT"'),(0,a.kt)("td",{parentName:"tr",align:null},"Export file format")),(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Word-Level Timings"),(0,a.kt)("td",{parentName:"tr",align:null},"Off / On"),(0,a.kt)("td",{parentName:"tr",align:null},"Off"),(0,a.kt)("td",{parentName:"tr",align:null},"If checked, the transcription will generate a separate subtitle line for each word in the audio. Combine words into subtitles afterwards with the ",(0,a.kt)("a",{parentName:"td",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"resize option"),".")),(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Extract speech"),(0,a.kt)("td",{parentName:"tr",align:null},"Off / On"),(0,a.kt)("td",{parentName:"tr",align:null},"Off"),(0,a.kt)("td",{parentName:"tr",align:null},"If checked, speech will be extracted to a separate audio tack to improve accuracy. 
Available since 1.3.0.")))),(0,a.kt)("p",null,"(See the ",(0,a.kt)("a",{parentName:"p",href:"https://chidiwilliams.github.io/buzz/docs/usage/live_recording"},"Live Recording section")," for more information about the task, language, and quality settings.)"),(0,a.kt)("p",null,(0,a.kt)("a",{parentName:"p",href:"https://www.loom.com/share/cf263b099ac3481082bb56d19b7c87fe",title:"Media File Import on Buzz"},(0,a.kt)("img",{parentName:"a",src:"https://cdn.loom.com/sessions/thumbnails/cf263b099ac3481082bb56d19b7c87fe-with-play.gif",alt:"Media File Import on Buzz"}))),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"\ud83d\udca1 Tip:")," It is recommended to always select language to transcribe to as automatic language detection may result in unexpected results."))}m.isMDXComponent=!0}}]); \ No newline at end of file +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[559],{3905:(e,t,n)=>{n.d(t,{Zo:()=>c,kt:()=>f});var r=n(7294);function a(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function o(e){for(var t=1;t=0||(a[n]=e[n]);return a}(e,t);if(Object.getOwnPropertySymbols){var i=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(a[n]=e[n])}return a}var p=r.createContext({}),s=function(e){var t=r.useContext(p),n=t;return e&&(n="function"==typeof e?e(t):o(o({},t),e)),n},c=function(e){var t=s(e.components);return r.createElement(p.Provider,{value:t},e.children)},u="mdxType",m={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},d=r.forwardRef((function(e,t){var 
n=e.components,a=e.mdxType,i=e.originalType,p=e.parentName,c=l(e,["components","mdxType","originalType","parentName"]),u=s(n),d=a,f=u["".concat(p,".").concat(d)]||u[d]||m[d]||i;return n?r.createElement(f,o(o({ref:t},c),{},{components:n})):r.createElement(f,o({ref:t},c))}));function f(e,t){var n=arguments,a=t&&t.mdxType;if("string"==typeof e||a){var i=n.length,o=new Array(i);o[0]=d;var l={};for(var p in t)hasOwnProperty.call(t,p)&&(l[p]=t[p]);l.originalType=e,l[u]="string"==typeof e?e:a,o[1]=l;for(var s=2;s{n.r(t),n.d(t,{assets:()=>p,contentTitle:()=>o,default:()=>m,frontMatter:()=>i,metadata:()=>l,toc:()=>s});var r=n(7462),a=(n(7294),n(3905));const i={title:"File Import"},o=void 0,l={unversionedId:"usage/file_import",id:"usage/file_import",title:"File Import",description:"To import a file:",source:"@site/docs/usage/1_file_import.md",sourceDirName:"usage",slug:"/usage/file_import",permalink:"/buzz/docs/usage/file_import",draft:!1,tags:[],version:"current",sidebarPosition:1,frontMatter:{title:"File Import"},sidebar:"tutorialSidebar",previous:{title:"Installation",permalink:"/buzz/docs/installation"},next:{title:"Live Recording",permalink:"/buzz/docs/usage/live_recording"}},p={},s=[],c={toc:s},u="wrapper";function m(e){let{components:t,...n}=e;return(0,a.kt)(u,(0,r.Z)({},c,n,{components:t,mdxType:"MDXLayout"}),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"To import a file:")),(0,a.kt)("ul",null,(0,a.kt)("li",{parentName:"ul"},"Click Import Media File on the File menu (or the '+' icon on the toolbar, or ",(0,a.kt)("strong",{parentName:"li"},"Command/Ctrl + O"),")."),(0,a.kt)("li",{parentName:"ul"},"Choose an audio or video file."),(0,a.kt)("li",{parentName:"ul"},"Select a task, language, and the model settings."),(0,a.kt)("li",{parentName:"ul"},"Click Run."),(0,a.kt)("li",{parentName:"ul"},"When the transcription status shows 'Completed', double-click on the row (or select the row and click the '\u2922' icon) to\nopen the 
transcription.")),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"Available options:")),(0,a.kt)("p",null,"To reduce misspellings you can pass some commonly misspelled words in an ",(0,a.kt)("inlineCode",{parentName:"p"},"Initial prompt")," that is available under ",(0,a.kt)("inlineCode",{parentName:"p"},"Advanced...")," button. See this ",(0,a.kt)("a",{parentName:"p",href:"https://cookbook.openai.com/examples/whisper_prompting_guide#pass-names-in-the-prompt-to-prevent-misspellings"},"guide on prompting"),". "),(0,a.kt)("table",null,(0,a.kt)("thead",{parentName:"table"},(0,a.kt)("tr",{parentName:"thead"},(0,a.kt)("th",{parentName:"tr",align:null},"Field"),(0,a.kt)("th",{parentName:"tr",align:null},"Options"),(0,a.kt)("th",{parentName:"tr",align:null},"Default"),(0,a.kt)("th",{parentName:"tr",align:null},"Description"))),(0,a.kt)("tbody",{parentName:"table"},(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Export As"),(0,a.kt)("td",{parentName:"tr",align:null},'"TXT", "SRT", "VTT"'),(0,a.kt)("td",{parentName:"tr",align:null},'"TXT"'),(0,a.kt)("td",{parentName:"tr",align:null},"Export file format")),(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Word-Level Timings"),(0,a.kt)("td",{parentName:"tr",align:null},"Off / On"),(0,a.kt)("td",{parentName:"tr",align:null},"Off"),(0,a.kt)("td",{parentName:"tr",align:null},"If checked, the transcription will generate a separate subtitle line for each word in the audio. 
Combine words into subtitles afterwards with the ",(0,a.kt)("a",{parentName:"td",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"resize option"),".")),(0,a.kt)("tr",{parentName:"tbody"},(0,a.kt)("td",{parentName:"tr",align:null},"Extract speech"),(0,a.kt)("td",{parentName:"tr",align:null},"Off / On"),(0,a.kt)("td",{parentName:"tr",align:null},"Off"),(0,a.kt)("td",{parentName:"tr",align:null},"If checked, speech will be extracted to a separate audio tack to improve accuracy.")))),(0,a.kt)("p",null,"(See the ",(0,a.kt)("a",{parentName:"p",href:"https://chidiwilliams.github.io/buzz/docs/usage/live_recording"},"Live Recording section")," for more information about the task, language, and quality settings.)"),(0,a.kt)("p",null,(0,a.kt)("a",{parentName:"p",href:"https://www.loom.com/share/cf263b099ac3481082bb56d19b7c87fe",title:"Media File Import on Buzz"},(0,a.kt)("img",{parentName:"a",src:"https://cdn.loom.com/sessions/thumbnails/cf263b099ac3481082bb56d19b7c87fe-with-play.gif",alt:"Media File Import on Buzz"}))),(0,a.kt)("p",null,(0,a.kt)("strong",{parentName:"p"},"\ud83d\udca1 Tip:")," It is recommended to always select language to transcribe to as automatic language detection may result in unexpected results."))}m.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/409b9ecc.7778f743.js b/assets/js/409b9ecc.b74554d9.js similarity index 88% rename from assets/js/409b9ecc.7778f743.js rename to assets/js/409b9ecc.b74554d9.js index 0ca734c3..ddb44128 100644 --- a/assets/js/409b9ecc.7778f743.js +++ b/assets/js/409b9ecc.b74554d9.js @@ -1 +1 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[697],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function o(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var 
r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function a(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var o=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var l=r.createContext({}),c=function(e){var t=r.useContext(l),n=t;return e&&(n="function"==typeof e?e(t):a(a({},t),e)),n},u=function(e){var t=c(e.components);return r.createElement(l.Provider,{value:t},e.children)},p="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},f=r.forwardRef((function(e,t){var n=e.components,i=e.mdxType,o=e.originalType,l=e.parentName,u=s(e,["components","mdxType","originalType","parentName"]),p=c(n),f=i,m=p["".concat(l,".").concat(f)]||p[f]||d[f]||o;return n?r.createElement(m,a(a({ref:t},u),{},{components:n})):r.createElement(m,a({ref:t},u))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var o=n.length,a=new Array(o);a[0]=f;var s={};for(var l in t)hasOwnProperty.call(t,l)&&(s[l]=t[l]);s.originalType=e,s[p]="string"==typeof e?e:i,a[1]=s;for(var c=2;c{n.r(t),n.d(t,{assets:()=>l,contentTitle:()=>a,default:()=>d,frontMatter:()=>o,metadata:()=>s,toc:()=>c});var r=n(7462),i=(n(7294),n(3905));const o={title:"Edit and Resize"},a=void 0,s={unversionedId:"usage/edit_and_resize",id:"usage/edit_and_resize",title:"Edit and Resize",description:"Resize options",source:"@site/docs/usage/4_edit_and_resize.md",sourceDirName:"usage",slug:"/usage/edit_and_resize",permalink:"/buzz/docs/usage/edit_and_resize",draft:!1,tags:[],version:"current",sidebarPosition:4,frontMatter:{title:"Edit and Resize"},sidebar:"tutorialSidebar",previous:{title:"Translations",permalink:"/buzz/docs/usage/translations"},next:{title:"Speaker 
identification",permalink:"/buzz/docs/usage/speaker_identification"}},l={},c=[],u={toc:c},p="wrapper";function d(e){let{components:t,...n}=e;return(0,i.kt)(p,(0,r.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,(0,i.kt)("a",{parentName:"p",href:"https://www.loom.com/share/cf263b099ac3481082bb56d19b7c87fe",title:"Resize options"},(0,i.kt)("img",{parentName:"a",src:"https://raw.githubusercontent.com/chidiwilliams/buzz/main/share/screenshots/buzz-6-resize.png",alt:"Resize options"}))),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can edit it and export to different subtitle formats or plain text. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to resize the transcripts. Click on the "Resize" button so see available options. Transcripts that have been generated ',(0,i.kt)("strong",{parentName:"p"},"with word-level timings")," setting enabled can be combined into subtitles specifying different options, like maximum length of a subtitle and if subtitles should be split on punctuation. For transcripts that have been generated ",(0,i.kt)("strong",{parentName:"p"},"without word-level timings")," setting enabled can only be recombined specifying desired max length of a subtitle. "),(0,i.kt)("p",null,"If audio file is still present on the system word-level timing merge will also analyze the audio for silences to improve subtitle accuracy. Subtitle generation from transcripts with word-level timings is available since version 1.3.0."),(0,i.kt)("p",null,"The resize tool also has an option to extend end time of segments if you want the subtitles to be on the screen for longer. You can specify the amount of time in seconds to extend each subtitle segment. Buzz will add this amount of time to the end of each subtitle segment making sure that the end of a segment does not go over start of the next segment. 
This feature is available since 1.4.3."))}d.isMDXComponent=!0}}]); \ No newline at end of file +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[697],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function o(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function a(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var o=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var l=r.createContext({}),c=function(e){var t=r.useContext(l),n=t;return e&&(n="function"==typeof e?e(t):a(a({},t),e)),n},u=function(e){var t=c(e.components);return r.createElement(l.Provider,{value:t},e.children)},p="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},f=r.forwardRef((function(e,t){var n=e.components,i=e.mdxType,o=e.originalType,l=e.parentName,u=s(e,["components","mdxType","originalType","parentName"]),p=c(n),f=i,m=p["".concat(l,".").concat(f)]||p[f]||d[f]||o;return n?r.createElement(m,a(a({ref:t},u),{},{components:n})):r.createElement(m,a({ref:t},u))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var o=n.length,a=new Array(o);a[0]=f;var s={};for(var l in t)hasOwnProperty.call(t,l)&&(s[l]=t[l]);s.originalType=e,s[p]="string"==typeof e?e:i,a[1]=s;for(var c=2;c{n.r(t),n.d(t,{assets:()=>l,contentTitle:()=>a,default:()=>d,frontMatter:()=>o,metadata:()=>s,toc:()=>c});var r=n(7462),i=(n(7294),n(3905));const o={title:"Edit and Resize"},a=void 0,s={unversionedId:"usage/edit_and_resize",id:"usage/edit_and_resize",title:"Edit and Resize",description:"Resize 
options",source:"@site/docs/usage/4_edit_and_resize.md",sourceDirName:"usage",slug:"/usage/edit_and_resize",permalink:"/buzz/docs/usage/edit_and_resize",draft:!1,tags:[],version:"current",sidebarPosition:4,frontMatter:{title:"Edit and Resize"},sidebar:"tutorialSidebar",previous:{title:"Translations",permalink:"/buzz/docs/usage/translations"},next:{title:"Speaker identification",permalink:"/buzz/docs/usage/speaker_identification"}},l={},c=[],u={toc:c},p="wrapper";function d(e){let{components:t,...n}=e;return(0,i.kt)(p,(0,r.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,(0,i.kt)("a",{parentName:"p",href:"https://www.loom.com/share/cf263b099ac3481082bb56d19b7c87fe",title:"Resize options"},(0,i.kt)("img",{parentName:"a",src:"https://raw.githubusercontent.com/chidiwilliams/buzz/main/share/screenshots/buzz-6-resize.png",alt:"Resize options"}))),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can edit it and export to different subtitle formats or plain text. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to resize the transcripts. Click on the "Resize" button so see available options. Transcripts that have been generated ',(0,i.kt)("strong",{parentName:"p"},"with word-level timings")," setting enabled can be combined into subtitles specifying different options, like maximum length of a subtitle and if subtitles should be split on punctuation. For transcripts that have been generated ",(0,i.kt)("strong",{parentName:"p"},"without word-level timings")," setting enabled can only be recombined specifying desired max length of a subtitle. "),(0,i.kt)("p",null,"If audio file is still present on the system word-level timing merge will also analyze the audio for silences to improve subtitle accuracy. 
"),(0,i.kt)("p",null,"The resize tool also has an option to extend end time of segments if you want the subtitles to be on the screen for longer. You can specify the amount of time in seconds to extend each subtitle segment. Buzz will add this amount of time to the end of each subtitle segment making sure that the end of a segment does not go over start of the next segment. This feature is available since 1.4.3."))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/6ec58200.8170897d.js b/assets/js/6ec58200.a3addc77.js similarity index 97% rename from assets/js/6ec58200.8170897d.js rename to assets/js/6ec58200.a3addc77.js index 54b261f3..d686cb76 100644 --- a/assets/js/6ec58200.8170897d.js +++ b/assets/js/6ec58200.a3addc77.js @@ -1 +1 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[150],{3905:(e,t,n)=>{n.d(t,{Zo:()=>l,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function a(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function o(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var c=r.createContext({}),p=function(e){var t=r.useContext(c),n=t;return e&&(n="function"==typeof e?e(t):o(o({},t),e)),n},l=function(e){var t=p(e.components);return r.createElement(c.Provider,{value:t},e.children)},u="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},f=r.forwardRef((function(e,t){var 
n=e.components,i=e.mdxType,a=e.originalType,c=e.parentName,l=s(e,["components","mdxType","originalType","parentName"]),u=p(n),f=i,m=u["".concat(c,".").concat(f)]||u[f]||d[f]||a;return n?r.createElement(m,o(o({ref:t},l),{},{components:n})):r.createElement(m,o({ref:t},l))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var a=n.length,o=new Array(a);o[0]=f;var s={};for(var c in t)hasOwnProperty.call(t,c)&&(s[c]=t[c]);s.originalType=e,s[u]="string"==typeof e?e:i,o[1]=s;for(var p=2;p{n.r(t),n.d(t,{assets:()=>c,contentTitle:()=>o,default:()=>d,frontMatter:()=>a,metadata:()=>s,toc:()=>p});var r=n(7462),i=(n(7294),n(3905));const a={title:"Speaker identification"},o=void 0,s={unversionedId:"usage/speaker_identification",id:"usage/speaker_identification",title:"Speaker identification",description:"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.",source:"@site/docs/usage/5_speaker_identification.md",sourceDirName:"usage",slug:"/usage/speaker_identification",permalink:"/buzz/docs/usage/speaker_identification",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{title:"Speaker identification"},sidebar:"tutorialSidebar",previous:{title:"Edit and Resize",permalink:"/buzz/docs/usage/edit_and_resize"},next:{title:"Transcription Viewer",permalink:"/buzz/docs/usage/transcription_viewer"}},c={},p=[],l={toc:p},u="wrapper";function d(e){let{components:t,...n}=e;return(0,i.kt)(u,(0,r.Z)({},l,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to identify speakers. 
Click on the "Identify speakers" button so see available options. '),(0,i.kt)("p",null,'If audio file is still present on the system speaker identification will mark each speakers sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speakers real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is available since version 1.4.0 on all platforms except Intel macOS.'))}d.isMDXComponent=!0}}]); \ No newline at end of file +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[150],{3905:(e,t,n)=>{n.d(t,{Zo:()=>l,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function a(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function o(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var c=r.createContext({}),p=function(e){var t=r.useContext(c),n=t;return e&&(n="function"==typeof e?e(t):o(o({},t),e)),n},l=function(e){var t=p(e.components);return r.createElement(c.Provider,{value:t},e.children)},u="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},f=r.forwardRef((function(e,t){var n=e.components,i=e.mdxType,a=e.originalType,c=e.parentName,l=s(e,["components","mdxType","originalType","parentName"]),u=p(n),f=i,m=u["".concat(c,".").concat(f)]||u[f]||d[f]||a;return 
n?r.createElement(m,o(o({ref:t},l),{},{components:n})):r.createElement(m,o({ref:t},l))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var a=n.length,o=new Array(a);o[0]=f;var s={};for(var c in t)hasOwnProperty.call(t,c)&&(s[c]=t[c]);s.originalType=e,s[u]="string"==typeof e?e:i,o[1]=s;for(var p=2;p{n.r(t),n.d(t,{assets:()=>c,contentTitle:()=>o,default:()=>d,frontMatter:()=>a,metadata:()=>s,toc:()=>p});var r=n(7462),i=(n(7294),n(3905));const a={title:"Speaker identification"},o=void 0,s={unversionedId:"usage/speaker_identification",id:"usage/speaker_identification",title:"Speaker identification",description:"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.",source:"@site/docs/usage/5_speaker_identification.md",sourceDirName:"usage",slug:"/usage/speaker_identification",permalink:"/buzz/docs/usage/speaker_identification",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{title:"Speaker identification"},sidebar:"tutorialSidebar",previous:{title:"Edit and Resize",permalink:"/buzz/docs/usage/edit_and_resize"},next:{title:"Transcription Viewer",permalink:"/buzz/docs/usage/transcription_viewer"}},c={},p=[],l={toc:p},u="wrapper";function d(e){let{components:t,...n}=e;return(0,i.kt)(u,(0,r.Z)({},l,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to identify speakers. Click on the "Identify speakers" button so see available options. '),(0,i.kt)("p",null,'If audio file is still present on the system speaker identification will mark each speakers sentences with appropriate label. 
You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speakers real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is not available on Intel macOS.'))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/935f2afb.15830391.js b/assets/js/935f2afb.d422329a.js similarity index 96% rename from assets/js/935f2afb.15830391.js rename to assets/js/935f2afb.d422329a.js index 5f022461..d83792dc 100644 --- a/assets/js/935f2afb.15830391.js +++ b/assets/js/935f2afb.d422329a.js @@ -1 +1 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[53],{1109:e=>{e.exports=JSON.parse('{"pluginId":"default","version":"current","label":"Next","banner":null,"badge":false,"noIndex":false,"className":"docs-version-current","isLast":true,"docsSidebars":{"tutorialSidebar":[{"type":"link","label":"Introduction","href":"/buzz/docs/","docId":"index"},{"type":"link","label":"Installation","href":"/buzz/docs/installation","docId":"installation"},{"type":"category","label":"Usage","collapsible":true,"collapsed":true,"items":[{"type":"link","label":"File Import","href":"/buzz/docs/usage/file_import","docId":"usage/file_import"},{"type":"link","label":"Live Recording","href":"/buzz/docs/usage/live_recording","docId":"usage/live_recording"},{"type":"link","label":"Translations","href":"/buzz/docs/usage/translations","docId":"usage/translations"},{"type":"link","label":"Edit and Resize","href":"/buzz/docs/usage/edit_and_resize","docId":"usage/edit_and_resize"},{"type":"link","label":"Speaker identification","href":"/buzz/docs/usage/speaker_identification","docId":"usage/speaker_identification"},{"type":"link","label":"Transcription 
Viewer","href":"/buzz/docs/usage/transcription_viewer","docId":"usage/transcription_viewer"}]},{"type":"link","label":"Preferences","href":"/buzz/docs/preferences","docId":"preferences"},{"type":"link","label":"CLI","href":"/buzz/docs/cli","docId":"cli"},{"type":"link","label":"FAQ","href":"/buzz/docs/faq","docId":"faq"}]},"docs":{"cli":{"id":"cli","title":"CLI","description":"Commands","sidebar":"tutorialSidebar"},"faq":{"id":"faq","title":"FAQ","description":"1. Where are the models stored?","sidebar":"tutorialSidebar"},"index":{"id":"index","title":"Introduction","description":"Transcribe and translate audio offline on your personal computer. Powered by","sidebar":"tutorialSidebar"},"installation":{"id":"installation","title":"Installation","description":"To install Buzz, download the latest version for your operating","sidebar":"tutorialSidebar"},"preferences":{"id":"preferences","title":"Preferences","description":"Open the Preferences window from the Menu bar, or click Ctrl/Cmd + ,.","sidebar":"tutorialSidebar"},"usage/edit_and_resize":{"id":"usage/edit_and_resize","title":"Edit and Resize","description":"Resize options","sidebar":"tutorialSidebar"},"usage/file_import":{"id":"usage/file_import","title":"File Import","description":"To import a file:","sidebar":"tutorialSidebar"},"usage/live_recording":{"id":"usage/live_recording","title":"Live Recording","description":"To start a live recording:","sidebar":"tutorialSidebar"},"usage/speaker_identification":{"id":"usage/speaker_identification","title":"Speaker identification","description":"When transcript of some audio or video file is generated you can identify speakers in the transcript. 
Double-click the transcript in the list of transcripts to see additional options for editing and exporting.","sidebar":"tutorialSidebar"},"usage/transcription_viewer":{"id":"usage/transcription_viewer","title":"Transcription Viewer","description":"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.","sidebar":"tutorialSidebar"},"usage/translations":{"id":"usage/translations","title":"Translations","description":"Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Since version 1.0.0 Buzz supports additional AI translations to any other language.","sidebar":"tutorialSidebar"}}}')}}]); \ No newline at end of file +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[53],{1109:e=>{e.exports=JSON.parse('{"pluginId":"default","version":"current","label":"Next","banner":null,"badge":false,"noIndex":false,"className":"docs-version-current","isLast":true,"docsSidebars":{"tutorialSidebar":[{"type":"link","label":"Introduction","href":"/buzz/docs/","docId":"index"},{"type":"link","label":"Installation","href":"/buzz/docs/installation","docId":"installation"},{"type":"category","label":"Usage","collapsible":true,"collapsed":true,"items":[{"type":"link","label":"File Import","href":"/buzz/docs/usage/file_import","docId":"usage/file_import"},{"type":"link","label":"Live Recording","href":"/buzz/docs/usage/live_recording","docId":"usage/live_recording"},{"type":"link","label":"Translations","href":"/buzz/docs/usage/translations","docId":"usage/translations"},{"type":"link","label":"Edit and Resize","href":"/buzz/docs/usage/edit_and_resize","docId":"usage/edit_and_resize"},{"type":"link","label":"Speaker 
identification","href":"/buzz/docs/usage/speaker_identification","docId":"usage/speaker_identification"},{"type":"link","label":"Transcription Viewer","href":"/buzz/docs/usage/transcription_viewer","docId":"usage/transcription_viewer"}]},{"type":"link","label":"Preferences","href":"/buzz/docs/preferences","docId":"preferences"},{"type":"link","label":"CLI","href":"/buzz/docs/cli","docId":"cli"},{"type":"link","label":"FAQ","href":"/buzz/docs/faq","docId":"faq"}]},"docs":{"cli":{"id":"cli","title":"CLI","description":"Commands","sidebar":"tutorialSidebar"},"faq":{"id":"faq","title":"FAQ","description":"1. Where are the models stored?","sidebar":"tutorialSidebar"},"index":{"id":"index","title":"Introduction","description":"Transcribe and translate audio offline on your personal computer. Powered by","sidebar":"tutorialSidebar"},"installation":{"id":"installation","title":"Installation","description":"To install Buzz, download the latest version for your operating","sidebar":"tutorialSidebar"},"preferences":{"id":"preferences","title":"Preferences","description":"Open the Preferences window from the Menu bar, or click Ctrl/Cmd + ,.","sidebar":"tutorialSidebar"},"usage/edit_and_resize":{"id":"usage/edit_and_resize","title":"Edit and Resize","description":"Resize options","sidebar":"tutorialSidebar"},"usage/file_import":{"id":"usage/file_import","title":"File Import","description":"To import a file:","sidebar":"tutorialSidebar"},"usage/live_recording":{"id":"usage/live_recording","title":"Live Recording","description":"To start a live recording:","sidebar":"tutorialSidebar"},"usage/speaker_identification":{"id":"usage/speaker_identification","title":"Speaker identification","description":"When transcript of some audio or video file is generated you can identify speakers in the transcript. 
Double-click the transcript in the list of transcripts to see additional options for editing and exporting.","sidebar":"tutorialSidebar"},"usage/transcription_viewer":{"id":"usage/transcription_viewer","title":"Transcription Viewer","description":"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.","sidebar":"tutorialSidebar"},"usage/translations":{"id":"usage/translations","title":"Translations","description":"Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Buzz supports additional AI translations to any other language.","sidebar":"tutorialSidebar"}}}')}}]); \ No newline at end of file diff --git a/assets/js/dbcee777.bee5d14d.js b/assets/js/dbcee777.bee5d14d.js new file mode 100644 index 00000000..38ab7d90 --- /dev/null +++ b/assets/js/dbcee777.bee5d14d.js @@ -0,0 +1 @@ +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[598],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>d});var a=n(7294);function r(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function l(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var i=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var s=a.createContext({}),p=function(e){var t=a.useContext(s),n=t;return e&&(n="function"==typeof e?e(t):l(l({},t),e)),n},u=function(e){var t=p(e.components);return a.createElement(s.Provider,{value:t},e.children)},m="mdxType",c={inlineCode:"code",wrapper:function(e){var 
t=e.children;return a.createElement(a.Fragment,{},t)}},k=a.forwardRef((function(e,t){var n=e.components,r=e.mdxType,i=e.originalType,s=e.parentName,u=o(e,["components","mdxType","originalType","parentName"]),m=p(n),k=r,d=m["".concat(s,".").concat(k)]||m[k]||c[k]||i;return n?a.createElement(d,l(l({ref:t},u),{},{components:n})):a.createElement(d,l({ref:t},u))}));function d(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var i=n.length,l=new Array(i);l[0]=k;var o={};for(var s in t)hasOwnProperty.call(t,s)&&(o[s]=t[s]);o.originalType=e,o[m]="string"==typeof e?e:r,l[1]=o;for(var p=2;p{n.r(t),n.d(t,{assets:()=>s,contentTitle:()=>l,default:()=>c,frontMatter:()=>i,metadata:()=>o,toc:()=>p});var a=n(7462),r=(n(7294),n(3905));const i={},l="Transcription Viewer",o={unversionedId:"usage/transcription_viewer",id:"usage/transcription_viewer",title:"Transcription Viewer",description:"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. 
This guide covers all the features available in the transcription viewer.",source:"@site/docs/usage/5_transcription_viewer.md",sourceDirName:"usage",slug:"/usage/transcription_viewer",permalink:"/buzz/docs/usage/transcription_viewer",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{},sidebar:"tutorialSidebar",previous:{title:"Speaker identification",permalink:"/buzz/docs/usage/speaker_identification"},next:{title:"Preferences",permalink:"/buzz/docs/preferences"}},s={},p=[{value:"Overview",id:"overview",level:2},{value:"Top Toolbar",id:"top-toolbar",level:2},{value:"View Mode Button",id:"view-mode-button",level:3},{value:"Export Button",id:"export-button",level:3},{value:"Translate Button",id:"translate-button",level:3},{value:"Resize Button",id:"resize-button",level:3},{value:"Playback Controls Button",id:"playback-controls-button",level:3},{value:"Find Button",id:"find-button",level:3},{value:"Scroll to Current Button",id:"scroll-to-current-button",level:3},{value:"Search Functionality",id:"search-functionality",level:2},{value:"Search Bar",id:"search-bar",level:3},{value:"Search Shortcuts",id:"search-shortcuts",level:3},{value:"Search Features",id:"search-features",level:3},{value:"Playback Controls",id:"playback-controls",level:2},{value:"Loop Segment",id:"loop-segment",level:3},{value:"Follow Audio",id:"follow-audio",level:3},{value:"Speed Controls",id:"speed-controls",level:3},{value:"Keyboard Shortcuts",id:"keyboard-shortcuts",level:2},{value:"Audio Playback",id:"audio-playback",level:3},{value:"Timestamp Adjustment",id:"timestamp-adjustment",level:3},{value:"Navigation",id:"navigation",level:3},{value:"Search",id:"search",level:3}],u={toc:p},m="wrapper";function c(e){let{components:t,...n}=e;return(0,r.kt)(m,(0,a.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("h1",{id:"transcription-viewer"},"Transcription Viewer"),(0,r.kt)("p",null,"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating 
through your transcriptions. This guide covers all the features available in the transcription viewer."),(0,r.kt)("h2",{id:"overview"},"Overview"),(0,r.kt)("p",null,"The transcription viewer is organized into several key sections:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Top Toolbar"),": Contains view mode, export, translate, resize, and search"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Bar"),": Find and navigate through transcript text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Transcription Segments"),": Table view of all transcription segments with timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Playback Controls"),": Audio playback settings and speed controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Audio Player"),": Standard media player with progress bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Current Segment Display"),": Shows the currently selected or playing segment")),(0,r.kt)("h2",{id:"top-toolbar"},"Top Toolbar"),(0,r.kt)("h3",{id:"view-mode-button"},"View Mode Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Switch between different viewing modes"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Options"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Timestamps"),": Shows segments in a table format with start/end times"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Text"),": Shows combined text without timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Translation"),": Shows translated text (if available)")))),(0,r.kt)("h3",{id:"export-button"},"Export 
Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Export transcription in various formats"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Formats"),": SRT, VTT, TXT, JSON, and more"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open export menu and select desired format")),(0,r.kt)("h3",{id:"translate-button"},"Translate Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Translate transcription to different languages"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open translation settings and start translation")),(0,r.kt)("h3",{id:"resize-button"},"Resize Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust transcription segment boundaries"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open resize dialog for fine-tuning timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"More information"),": See ",(0,r.kt)("a",{parentName:"li",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"Edit and Resize")," section")),(0,r.kt)("h3",{id:"playback-controls-button"},"Playback Controls Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide playback control panel"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+Alt+P")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+Alt+P")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the playback controls below")),(0,r.kt)("h3",{id:"find-button"},"Find 
Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide search functionality"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+F")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+F")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the search bar")),(0,r.kt)("h3",{id:"scroll-to-current-button"},"Scroll to Current Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to the currently playing text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+G")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+G")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to jump to the current audio position in the transcript")),(0,r.kt)("h2",{id:"search-functionality"},"Search Functionality"),(0,r.kt)("h3",{id:"search-bar"},"Search Bar"),(0,r.kt)("p",null,"The search bar appears below the toolbar when activated and provides:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Input"),": Type text to find in the transcription (wider input field for better usability)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Navigation"),": Up/down arrows to move between matches"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Status"),': Shows current match position and total matches (e.g., "3 of 15 matches")'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Clear"),": Remove search text and results (larger button for better accessibility)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Results"),": 
Displays found text with context"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Consistent Button Sizing"),": All navigation buttons have uniform height for better visual consistency")),(0,r.kt)("h3",{id:"search-shortcuts"},"Search Shortcuts"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar on/off"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")),(0,r.kt)("h3",{id:"search-features"},"Search Features"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Real-time Search"),": Results update as you type"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Case-insensitive"),": Finds matches regardless of capitalization"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Word Boundaries"),": Respects word boundaries for accurate matching"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Cross-view Search"),": Works in all view modes (Timestamps, Text, Translation)")),(0,r.kt)("h2",{id:"playback-controls"},"Playback Controls"),(0,r.kt)("h3",{id:"loop-segment"},"Loop Segment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically loop playback of selected segments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Loop Segment" 
checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": When enabled, clicking on a transcript segment will set a loop range"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Visual Feedback"),": Loop range is highlighted in the audio player")),(0,r.kt)("h3",{id:"follow-audio"},"Follow Audio"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to current audio position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Follow Audio" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Transcript automatically follows the audio playback"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Benefits"),": Easy to follow along with long audio files")),(0,r.kt)("h3",{id:"speed-controls"},"Speed Controls"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust audio playback speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Range"),": 0.5x to 2.0x speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Controls"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Speed Dropdown"),": Select from preset speeds or enter custom value"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Decrease Button (-)"),": Reduce speed by 0.05x increments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Increase Button (+)"),": Increase speed by 0.05x increments"))),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Persistence"),": Speed setting is saved between sessions"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Button Sizing"),": Speed control buttons match the size of search navigation buttons for visual 
consistency")),(0,r.kt)("h2",{id:"keyboard-shortcuts"},"Keyboard Shortcuts"),(0,r.kt)("h3",{id:"audio-playback"},"Audio Playback"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+P")),": Play/Pause audio"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+P")),": Replay current segment from start")),(0,r.kt)("h3",{id:"timestamp-adjustment"},"Timestamp Adjustment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2190")),": Decrease segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2192")),": Increase segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2190")),": Decrease segment end time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2192")),": Increase segment end time by 0.5s")),(0,r.kt)("h3",{id:"navigation"},"Navigation"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search 
bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Alt+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Alt+P")),": Toggle playback controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+G")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+G")),": Scroll to current position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+O")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+O")),": Open file import dialog")),(0,r.kt)("h3",{id:"search"},"Search"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")))}c.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/dbcee777.cca98005.js b/assets/js/dbcee777.cca98005.js deleted file mode 100644 index 87155aba..00000000 --- a/assets/js/dbcee777.cca98005.js +++ /dev/null @@ -1 +0,0 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[598],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>d});var a=n(7294);function r(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function l(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var 
i=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var s=a.createContext({}),p=function(e){var t=a.useContext(s),n=t;return e&&(n="function"==typeof e?e(t):l(l({},t),e)),n},u=function(e){var t=p(e.components);return a.createElement(s.Provider,{value:t},e.children)},m="mdxType",c={inlineCode:"code",wrapper:function(e){var t=e.children;return a.createElement(a.Fragment,{},t)}},k=a.forwardRef((function(e,t){var n=e.components,r=e.mdxType,i=e.originalType,s=e.parentName,u=o(e,["components","mdxType","originalType","parentName"]),m=p(n),k=r,d=m["".concat(s,".").concat(k)]||m[k]||c[k]||i;return n?a.createElement(d,l(l({ref:t},u),{},{components:n})):a.createElement(d,l({ref:t},u))}));function d(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var i=n.length,l=new Array(i);l[0]=k;var o={};for(var s in t)hasOwnProperty.call(t,s)&&(o[s]=t[s]);o.originalType=e,o[m]="string"==typeof e?e:r,l[1]=o;for(var p=2;p{n.r(t),n.d(t,{assets:()=>s,contentTitle:()=>l,default:()=>c,frontMatter:()=>i,metadata:()=>o,toc:()=>p});var a=n(7462),r=(n(7294),n(3905));const i={},l="Transcription Viewer",o={unversionedId:"usage/transcription_viewer",id:"usage/transcription_viewer",title:"Transcription Viewer",description:"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. 
This guide covers all the features available in the transcription viewer.",source:"@site/docs/usage/5_transcription_viewer.md",sourceDirName:"usage",slug:"/usage/transcription_viewer",permalink:"/buzz/docs/usage/transcription_viewer",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{},sidebar:"tutorialSidebar",previous:{title:"Speaker identification",permalink:"/buzz/docs/usage/speaker_identification"},next:{title:"Preferences",permalink:"/buzz/docs/preferences"}},s={},p=[{value:"Overview",id:"overview",level:2},{value:"Top Toolbar",id:"top-toolbar",level:2},{value:"View Mode Button",id:"view-mode-button",level:3},{value:"Export Button",id:"export-button",level:3},{value:"Translate Button",id:"translate-button",level:3},{value:"Resize Button",id:"resize-button",level:3},{value:"Playback Controls Button",id:"playback-controls-button",level:3},{value:"Find Button",id:"find-button",level:3},{value:"Scroll to Current Button",id:"scroll-to-current-button",level:3},{value:"Search Functionality",id:"search-functionality",level:2},{value:"Search Bar",id:"search-bar",level:3},{value:"Search Shortcuts",id:"search-shortcuts",level:3},{value:"Search Features",id:"search-features",level:3},{value:"Playback Controls",id:"playback-controls",level:2},{value:"Loop Segment",id:"loop-segment",level:3},{value:"Follow Audio",id:"follow-audio",level:3},{value:"Speed Controls",id:"speed-controls",level:3},{value:"Keyboard Shortcuts",id:"keyboard-shortcuts",level:2},{value:"Audio Playback",id:"audio-playback",level:3},{value:"Timestamp Adjustment",id:"timestamp-adjustment",level:3},{value:"Navigation",id:"navigation",level:3},{value:"Search",id:"search",level:3}],u={toc:p},m="wrapper";function c(e){let{components:t,...n}=e;return(0,r.kt)(m,(0,a.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("h1",{id:"transcription-viewer"},"Transcription Viewer"),(0,r.kt)("p",null,"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating 
through your transcriptions. This guide covers all the features available in the transcription viewer."),(0,r.kt)("h2",{id:"overview"},"Overview"),(0,r.kt)("p",null,"The transcription viewer is organized into several key sections:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Top Toolbar"),": Contains view mode, export, translate, resize, and search"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Bar"),": Find and navigate through transcript text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Transcription Segments"),": Table view of all transcription segments with timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Playback Controls"),": Audio playback settings and speed controls (since version 1.3.0)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Audio Player"),": Standard media player with progress bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Current Segment Display"),": Shows the currently selected or playing segment")),(0,r.kt)("h2",{id:"top-toolbar"},"Top Toolbar"),(0,r.kt)("h3",{id:"view-mode-button"},"View Mode Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Switch between different viewing modes"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Options"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Timestamps"),": Shows segments in a table format with start/end times"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Text"),": Shows combined text without timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Translation"),": Shows translated text (if available)")))),(0,r.kt)("h3",{id:"export-button"},"Export 
Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Export transcription in various formats"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Formats"),": SRT, VTT, TXT, JSON, and more"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open export menu and select desired format")),(0,r.kt)("h3",{id:"translate-button"},"Translate Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Translate transcription to different languages"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open translation settings and start translation")),(0,r.kt)("h3",{id:"resize-button"},"Resize Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust transcription segment boundaries"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open resize dialog for fine-tuning timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"More information"),": See ",(0,r.kt)("a",{parentName:"li",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"Edit and Resize")," section")),(0,r.kt)("h3",{id:"playback-controls-button"},"Playback Controls Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide playback control panel"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+Alt+P")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+Alt+P")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the playback controls below")),(0,r.kt)("h3",{id:"find-button"},"Find 
Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide search functionality"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+F")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+F")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the search bar")),(0,r.kt)("h3",{id:"scroll-to-current-button"},"Scroll to Current Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to the currently playing text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+G")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+G")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to jump to the current audio position in the transcript")),(0,r.kt)("h2",{id:"search-functionality"},"Search Functionality"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"search-bar"},"Search Bar"),(0,r.kt)("p",null,"The search bar appears below the toolbar when activated and provides:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Input"),": Type text to find in the transcription (wider input field for better usability)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Navigation"),": Up/down arrows to move between matches"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Status"),': Shows current match position and total matches (e.g., "3 of 15 matches")'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Clear"),": Remove search text and 
results (larger button for better accessibility)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Results"),": Displays found text with context"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Consistent Button Sizing"),": All navigation buttons have uniform height for better visual consistency")),(0,r.kt)("h3",{id:"search-shortcuts"},"Search Shortcuts"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar on/off"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")),(0,r.kt)("h3",{id:"search-features"},"Search Features"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Real-time Search"),": Results update as you type"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Case-insensitive"),": Finds matches regardless of capitalization"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Word Boundaries"),": Respects word boundaries for accurate matching"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Cross-view Search"),": Works in all view modes (Timestamps, Text, Translation)")),(0,r.kt)("h2",{id:"playback-controls"},"Playback Controls"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"loop-segment"},"Loop Segment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically loop playback of selected 
segments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Loop Segment" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": When enabled, clicking on a transcript segment will set a loop range"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Visual Feedback"),": Loop range is highlighted in the audio player")),(0,r.kt)("h3",{id:"follow-audio"},"Follow Audio"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to current audio position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Follow Audio" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Transcript automatically follows the audio playback"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Benefits"),": Easy to follow along with long audio files")),(0,r.kt)("h3",{id:"speed-controls"},"Speed Controls"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust audio playback speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Range"),": 0.5x to 2.0x speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Controls"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Speed Dropdown"),": Select from preset speeds or enter custom value"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Decrease Button (-)"),": Reduce speed by 0.05x increments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Increase Button (+)"),": Increase speed by 0.05x increments"))),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Persistence"),": Speed setting is saved between 
sessions"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Button Sizing"),": Speed control buttons match the size of search navigation buttons for visual consistency")),(0,r.kt)("h2",{id:"keyboard-shortcuts"},"Keyboard Shortcuts"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"audio-playback"},"Audio Playback"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+P")),": Play/Pause audio"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+P")),": Replay current segment from start")),(0,r.kt)("h3",{id:"timestamp-adjustment"},"Timestamp Adjustment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2190")),": Decrease segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2192")),": Increase segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2190")),": Decrease segment end time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2192")),": Increase segment end time by 
0.5s")),(0,r.kt)("h3",{id:"navigation"},"Navigation"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Alt+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Alt+P")),": Toggle playback controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+G")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+G")),": Scroll to current position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+O")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+O")),": Open file import dialog")),(0,r.kt)("h3",{id:"search"},"Search"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")))}c.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/assets/js/runtime~main.02a8de98.js b/assets/js/runtime~main.bed7610c.js similarity index 73% rename from assets/js/runtime~main.02a8de98.js rename to assets/js/runtime~main.bed7610c.js index 81d486d8..0c2df813 100644 --- a/assets/js/runtime~main.02a8de98.js +++ b/assets/js/runtime~main.bed7610c.js @@ -1 +1 @@ -(()=>{"use strict";var e,t,r,o,a,n={},c={};function d(e){var t=c[e];if(void 0!==t)return t.exports;var r=c[e]={id:e,loaded:!1,exports:{}};return 
n[e].call(r.exports,r,r.exports,d),r.loaded=!0,r.exports}d.m=n,d.c=c,e=[],d.O=(t,r,o,a)=>{if(!r){var n=1/0;for(b=0;b=a)&&Object.keys(d.O).every((e=>d.O[e](r[f])))?r.splice(f--,1):(c=!1,a0&&e[b-1][2]>a;b--)e[b]=e[b-1];e[b]=[r,o,a]},d.n=e=>{var t=e&&e.__esModule?()=>e.default:()=>e;return d.d(t,{a:t}),t},r=Object.getPrototypeOf?e=>Object.getPrototypeOf(e):e=>e.__proto__,d.t=function(e,o){if(1&o&&(e=this(e)),8&o)return e;if("object"==typeof e&&e){if(4&o&&e.__esModule)return e;if(16&o&&"function"==typeof e.then)return e}var a=Object.create(null);d.r(a);var n={};t=t||[null,r({}),r([]),r(r)];for(var c=2&o&&e;"object"==typeof c&&!~t.indexOf(c);c=r(c))Object.getOwnPropertyNames(c).forEach((t=>n[t]=()=>e[t]));return n.default=()=>e,d.d(a,n),a},d.d=(e,t)=>{for(var r in t)d.o(t,r)&&!d.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},d.f={},d.e=e=>Promise.all(Object.keys(d.f).reduce(((t,r)=>(d.f[r](e,t),t)),[])),d.u=e=>"assets/js/"+({53:"935f2afb",150:"6ec58200",217:"3b8c55ea",237:"1df93b7f",382:"1102fda7",468:"1a20bc57",514:"1be78505",559:"36b603e5",598:"dbcee777",697:"409b9ecc",799:"2c266bbb",836:"0480b142",860:"3e407b54",884:"343de823",918:"17896441",958:"6dbc2e00",971:"c377a04b"}[e]||e)+"."+{53:"15830391",150:"8170897d",217:"cd236734",237:"71d7b441",382:"cd2bd517",468:"af8afb84",514:"131974b6",559:"6df0f804",598:"cca98005",697:"7778f743",799:"2d6b08c4",836:"6861ca9e",860:"987a7018",884:"d33c8b39",918:"0aaaf3b3",958:"24fcb0eb",971:"2f3d6e44",972:"d5cc17b1"}[e]+".js",d.miniCssF=e=>{},d.g=function(){if("object"==typeof globalThis)return globalThis;try{return this||new Function("return this")()}catch(e){if("object"==typeof window)return window}}(),d.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),o={},a="docs:",d.l=(e,t,r,n)=>{if(o[e])o[e].push(t);else{var c,f;if(void 0!==r)for(var i=document.getElementsByTagName("script"),b=0;b{c.onerror=c.onload=null,clearTimeout(s);var a=o[e];if(delete 
o[e],c.parentNode&&c.parentNode.removeChild(c),a&&a.forEach((e=>e(r))),t)return t(r)},s=setTimeout(l.bind(null,void 0,{type:"timeout",target:c}),12e4);c.onerror=l.bind(null,c.onerror),c.onload=l.bind(null,c.onload),f&&document.head.appendChild(c)}},d.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},d.p="/buzz/",d.gca=function(e){return e={17896441:"918","935f2afb":"53","6ec58200":"150","3b8c55ea":"217","1df93b7f":"237","1102fda7":"382","1a20bc57":"468","1be78505":"514","36b603e5":"559",dbcee777:"598","409b9ecc":"697","2c266bbb":"799","0480b142":"836","3e407b54":"860","343de823":"884","6dbc2e00":"958",c377a04b:"971"}[e]||e,d.p+d.u(e)},(()=>{var e={303:0,532:0};d.f.j=(t,r)=>{var o=d.o(e,t)?e[t]:void 0;if(0!==o)if(o)r.push(o[2]);else if(/^(303|532)$/.test(t))e[t]=0;else{var a=new Promise(((r,a)=>o=e[t]=[r,a]));r.push(o[2]=a);var n=d.p+d.u(t),c=new Error;d.l(n,(r=>{if(d.o(e,t)&&(0!==(o=e[t])&&(e[t]=void 0),o)){var a=r&&("load"===r.type?"missing":r.type),n=r&&r.target&&r.target.src;c.message="Loading chunk "+t+" failed.\n("+a+": "+n+")",c.name="ChunkLoadError",c.type=a,c.request=n,o[1](c)}}),"chunk-"+t,t)}},d.O.j=t=>0===e[t];var t=(t,r)=>{var o,a,n=r[0],c=r[1],f=r[2],i=0;if(n.some((t=>0!==e[t]))){for(o in c)d.o(c,o)&&(d.m[o]=c[o]);if(f)var b=f(d)}for(t&&t(r);i{"use strict";var e,t,r,o,a,n={},c={};function d(e){var t=c[e];if(void 0!==t)return t.exports;var r=c[e]={id:e,loaded:!1,exports:{}};return n[e].call(r.exports,r,r.exports,d),r.loaded=!0,r.exports}d.m=n,d.c=c,e=[],d.O=(t,r,o,a)=>{if(!r){var n=1/0;for(f=0;f=a)&&Object.keys(d.O).every((e=>d.O[e](r[i])))?r.splice(i--,1):(c=!1,a0&&e[f-1][2]>a;f--)e[f]=e[f-1];e[f]=[r,o,a]},d.n=e=>{var t=e&&e.__esModule?()=>e.default:()=>e;return d.d(t,{a:t}),t},r=Object.getPrototypeOf?e=>Object.getPrototypeOf(e):e=>e.__proto__,d.t=function(e,o){if(1&o&&(e=this(e)),8&o)return e;if("object"==typeof 
e&&e){if(4&o&&e.__esModule)return e;if(16&o&&"function"==typeof e.then)return e}var a=Object.create(null);d.r(a);var n={};t=t||[null,r({}),r([]),r(r)];for(var c=2&o&&e;"object"==typeof c&&!~t.indexOf(c);c=r(c))Object.getOwnPropertyNames(c).forEach((t=>n[t]=()=>e[t]));return n.default=()=>e,d.d(a,n),a},d.d=(e,t)=>{for(var r in t)d.o(t,r)&&!d.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},d.f={},d.e=e=>Promise.all(Object.keys(d.f).reduce(((t,r)=>(d.f[r](e,t),t)),[])),d.u=e=>"assets/js/"+({53:"935f2afb",150:"6ec58200",217:"3b8c55ea",237:"1df93b7f",382:"1102fda7",468:"1a20bc57",514:"1be78505",559:"36b603e5",598:"dbcee777",697:"409b9ecc",799:"2c266bbb",836:"0480b142",860:"3e407b54",884:"343de823",918:"17896441",958:"6dbc2e00",971:"c377a04b"}[e]||e)+"."+{53:"d422329a",150:"a3addc77",217:"cd236734",237:"71d7b441",382:"cd2bd517",468:"af8afb84",514:"131974b6",559:"55d4006f",598:"bee5d14d",697:"b74554d9",799:"7fe1d26b",836:"6861ca9e",860:"987a7018",884:"33e65bd6",918:"0aaaf3b3",958:"24fcb0eb",971:"2f3d6e44",972:"d5cc17b1"}[e]+".js",d.miniCssF=e=>{},d.g=function(){if("object"==typeof globalThis)return globalThis;try{return this||new Function("return this")()}catch(e){if("object"==typeof window)return window}}(),d.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),o={},a="docs:",d.l=(e,t,r,n)=>{if(o[e])o[e].push(t);else{var c,i;if(void 0!==r)for(var b=document.getElementsByTagName("script"),f=0;f{c.onerror=c.onload=null,clearTimeout(s);var a=o[e];if(delete o[e],c.parentNode&&c.parentNode.removeChild(c),a&&a.forEach((e=>e(r))),t)return t(r)},s=setTimeout(l.bind(null,void 0,{type:"timeout",target:c}),12e4);c.onerror=l.bind(null,c.onerror),c.onload=l.bind(null,c.onload),i&&document.head.appendChild(c)}},d.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},d.p="/buzz/",d.gca=function(e){return 
e={17896441:"918","935f2afb":"53","6ec58200":"150","3b8c55ea":"217","1df93b7f":"237","1102fda7":"382","1a20bc57":"468","1be78505":"514","36b603e5":"559",dbcee777:"598","409b9ecc":"697","2c266bbb":"799","0480b142":"836","3e407b54":"860","343de823":"884","6dbc2e00":"958",c377a04b:"971"}[e]||e,d.p+d.u(e)},(()=>{var e={303:0,532:0};d.f.j=(t,r)=>{var o=d.o(e,t)?e[t]:void 0;if(0!==o)if(o)r.push(o[2]);else if(/^(303|532)$/.test(t))e[t]=0;else{var a=new Promise(((r,a)=>o=e[t]=[r,a]));r.push(o[2]=a);var n=d.p+d.u(t),c=new Error;d.l(n,(r=>{if(d.o(e,t)&&(0!==(o=e[t])&&(e[t]=void 0),o)){var a=r&&("load"===r.type?"missing":r.type),n=r&&r.target&&r.target.src;c.message="Loading chunk "+t+" failed.\n("+a+": "+n+")",c.name="ChunkLoadError",c.type=a,c.request=n,o[1](c)}}),"chunk-"+t,t)}},d.O.j=t=>0===e[t];var t=(t,r)=>{var o,a,n=r[0],c=r[1],i=r[2],b=0;if(n.some((t=>0!==e[t]))){for(o in c)d.o(c,o)&&(d.m[o]=c[o]);if(i)var f=i(d)}for(t&&t(r);b Introduction | Buzz - + @@ -20,7 +20,7 @@ real-time, Whisper.cpp (with Vulkan GPU acceleration), Faster Whisper, Whisper-compatible Hugging Face models, and the OpenAI Whisper API
  • Command-Line Interface
  • Speech separation before transcription for better accuracy on noisy audio
  • Speaker identification in transcribed media
  • Available on Mac, Windows, and Linux
  • - + \ No newline at end of file diff --git a/docs/cli.html b/docs/cli.html index 589301c6..ce89023c 100644 --- a/docs/cli.html +++ b/docs/cli.html @@ -4,13 +4,13 @@ CLI | Buzz - +

    CLI

    Commands

    add

    Start a new transcription task.

    Usage: buzz add [options] [file url file...]

    Options:
    -t, --task <task> The task to perform. Allowed: translate,
    transcribe. Default: transcribe.
    -m, --model-type <model-type> Model type. Allowed: whisper, whispercpp,
    huggingface, fasterwhisper, openaiapi. Default:
    whisper.
    -s, --model-size <model-size> Model size. Use only when --model-type is
    whisper, whispercpp, or fasterwhisper. Allowed:
    tiny, base, small, medium, large. Default:
    tiny.
    --hfid <id> Hugging Face model ID. Use only when
    --model-type is huggingface. Example:
    "openai/whisper-tiny"
    -l, --language <code> Language code. Allowed: af (Afrikaans), am
    (Amharic), ar (Arabic), as (Assamese), az
    (Azerbaijani), ba (Bashkir), be (Belarusian),
    bg (Bulgarian), bn (Bengali), bo (Tibetan), br
    (Breton), bs (Bosnian), ca (Catalan), cs
    (Czech), cy (Welsh), da (Danish), de (German),
    el (Greek), en (English), es (Spanish), et
    (Estonian), eu (Basque), fa (Persian), fi
    (Finnish), fo (Faroese), fr (French), gl
    (Galician), gu (Gujarati), ha (Hausa), haw
    (Hawaiian), he (Hebrew), hi (Hindi), hr
    (Croatian), ht (Haitian Creole), hu
    (Hungarian), hy (Armenian), id (Indonesian), is
    (Icelandic), it (Italian), ja (Japanese), jw
    (Javanese), ka (Georgian), kk (Kazakh), km
    (Khmer), kn (Kannada), ko (Korean), la (Latin),
    lb (Luxembourgish), ln (Lingala), lo (Lao), lt
    (Lithuanian), lv (Latvian), mg (Malagasy), mi
    (Maori), mk (Macedonian), ml (Malayalam), mn
    (Mongolian), mr (Marathi), ms (Malay), mt
    (Maltese), my (Myanmar), ne (Nepali), nl
    (Dutch), nn (Nynorsk), no (Norwegian), oc
    (Occitan), pa (Punjabi), pl (Polish), ps
    (Pashto), pt (Portuguese), ro (Romanian), ru
    (Russian), sa (Sanskrit), sd (Sindhi), si
    (Sinhala), sk (Slovak), sl (Slovenian), sn
    (Shona), so (Somali), sq (Albanian), sr
    (Serbian), su (Sundanese), sv (Swedish), sw
    (Swahili), ta (Tamil), te (Telugu), tg (Tajik),
    th (Thai), tk (Turkmen), tl (Tagalog), tr
    (Turkish), tt (Tatar), uk (Ukrainian), ur
    (Urdu), uz (Uzbek), vi (Vietnamese), yi
    (Yiddish), yo (Yoruba), zh (Chinese). Leave
    empty to detect language.
    -p, --prompt <prompt> Initial prompt.
    -w, --word-timestamps Generate word-level timestamps. (available since 1.2.0)
    -e, --extract-speech Extract speech from audio before transcribing. (available since 1.3.0)
    --openai-token <token> OpenAI access token. Use only when
    --model-type is openaiapi. Defaults to your
    previously saved access token, if one exists.
    --srt Output result in an SRT file.
    --vtt Output result in a VTT file.
    --txt Output result in a TXT file.
    --hide-gui Hide the main application window. (available since 1.2.0)
    -h, --help Displays help on commandline options.
    --help-all Displays help including Qt specific options.
    -v, --version Displays version information.

    Arguments:
    files or urls Input file paths or urls. Url import available since 1.2.0.

    Examples:

    # Translate two MP3 files from French to English using OpenAI Whisper API
    buzz add --task translate --language fr --model-type openaiapi /Users/user/Downloads/1b3b03e4-8db5-ea2c-ace5-b71ff32e3304.mp3 /Users/user/Downloads/koaf9083k1lkpsfdi0.mp3

    # Transcribe an MP4 using Whisper.cpp "small" model and immediately export to SRT and VTT files
    buzz add --task transcribe --model-type whispercpp --model-size small --prompt "My initial prompt" --srt --vtt /Users/user/Downloads/buzz/1b3b03e4-8db5-ea2c-ace5-b71ff32e3304.mp4
    - + \ No newline at end of file diff --git a/docs/faq.html b/docs/faq.html index a20f844c..57444633 100644 --- a/docs/faq.html +++ b/docs/faq.html @@ -4,7 +4,7 @@ FAQ | Buzz - + @@ -12,7 +12,7 @@

    FAQ

    1. Where are the models stored?

    The models are stored:

    • Linux: ~/.cache/Buzz
    • Mac OS: ~/Library/Caches/Buzz
    • Windows: %USERPROFILE%\AppData\Local\Buzz\Buzz\Cache

    Paste the location in your file manager to access the models or go to Help -> Preferences -> Models and click on Show file location button after downloading some model.

    2. What can I try if the transcription runs too slowly?

    Speech recognition requires a large amount of computation, so one option is to try using a smaller Whisper model size or using a Whisper.cpp model to run speech recognition on your computer. If you have access to a computer with a GPU that has at least 6GB of VRAM you can try using the Faster Whisper model.

    Buzz also supports using OpenAI API to do speech recognition on a remote server. To use this feature you need to set OpenAI API key in Preferences. See Preferences section for more details.

    3. How to record system audio?

    To transcribe system audio you need to configure virtual audio device and connect output from the applications you want to transcribe to this virtual speaker. After that you can select it as source in the Buzz. See Usage section for more details.

    Relevant tools:

    4. What model should I use?

    Model size to use will depend on your hardware and use case. Smaller models will work faster but will have more inaccuracies. Larger models will be more accurate but will require more powerful hardware or longer time to transcribe.

    When choosing among large models consider the following. "Large" is the first released older model, "Large-V2" is a later updated model with better accuracy, for some languages considered the most robust and stable. "Large-V3" is the latest model with the best accuracy in many cases, but sometimes can hallucinate or invent words that were never in the audio. "Turbo" model tries to get a good balance between speed and accuracy. The only sure way to know what model best suits your needs is to test them all in your language.

    In addition to choosing an appropriate model size you also can choose whisper type.

    • Whisper is initial OpenAI implementation, it is accurate but slow and requires a lot of RAM.
    • Faster Whisper is an optimized implementation, it is orders of magnitude faster than regular Whisper and requires less RAM. Use this option if you have an Nvidia GPU with at least 6GB of VRAM.
    • Whisper.cpp is an optimized C++ implementation, it is quite fast and efficient and will use any brand of GPU. Whisper.cpp is capable of running real time transcription even on a modern laptop with integrated GPU. It can also run on CPU only. Use this option if you do not have Nvidia GPU.
    • HuggingFace option is a Transformers implementation and is good in that it supports a wide range of custom models that may be optimized for a particular language. This option also supports MMS family of models from Meta AI that support over 1000 of the world's languages as well as PEFT adjustments to Whisper models.

    5. How to get GPU acceleration for faster transcription?

    On Linux GPU acceleration is supported out of the box on Nvidia GPUs. If you still get any issues install CUDA 12, cuBLAS and cuDNN.

    On Windows GPU support is included in the installation .exe. CUDA 12 required, computers with older CUDA versions will use CPU. See this note on enabling CUDA GPU support.

    6. How to fix Unanticipated host error[PaErrorCode-9999]?

    Check if there are any system settings preventing apps from accessing the microphone.

    On Windows, see if Buzz has permission to use the microphone in Settings -> Privacy -> Microphone.

    See method 1 in this video https://www.youtube.com/watch?v=eRcCYgOuSYQ

    For method 2 there is no need to uninstall the antivirus, but see if you can temporarily disable it or if there are settings that may prevent Buzz from accessing the microphone.

    7. Can I use Buzz on a computer without internet?

    Yes, Buzz can be used without internet connection if you download the necessary models on some other computer that has the internet and manually move them to the offline computer. The easiest way to find where the models are stored is to go to Help -> Preferences -> Models. Then download some model, and push "Show file location" button. This will open the folder where the models are stored. Copy the models folder to the same location on the offline computer. For example, on Linux it is .cache/Buzz/models in your home directory.

    8. Buzz crashes, what to do?

    If a model download was incomplete or corrupted, Buzz may crash. Try to delete the downloaded model files in Help -> Preferences -> Models and re-download them.

    If that does not help, check the log file for errors and report the issue so we can fix it. If possible attach the log file to the issue. Since Version 1.3.4, to get to the logs folder go to Help -> About Buzz and click on Show logs button.

    9. Where can I get latest development version?

    Latest development version will have latest bug fixes and most recent features. If you feel a bit adventurous it is recommended to try the latest development version as it needs some testing before it gets released to everybody.

    • Linux users can get the latest version with this command sudo snap install buzz --edge

    • For other platforms do the following:

      1. Go to the build section
      2. Click on the link to the latest build, the most recent successful build entry in the list
      3. Scroll down to the artifacts section in the build page
      4. Download the installation file. Please note that you need to be logged in to GitHub to see the download links. Latest build example

    10. Why is my system theme not applied to Buzz installed from Flatpak?

    For dark themes on Gnome environments you may need to install gnome-themes-extra package and set the following preferences:

    gsettings set org.gnome.desktop.interface gtk-theme Adwaita-dark
    gsettings set org.gnome.desktop.interface color-scheme prefer-dark

    If your system theme is not applied to Buzz installed from Flatpak Linux app store, ensure the desired theme is in ~/.themes folder.

    You may need to copy the system themes to this folder cp -r /usr/share/themes/ ~/.themes/ and give Flatpaks access to this folder flatpak override --user --filesystem=~/.themes.

    On Fedora run the following to install the necessary packages sudo dnf install gnome-themes-extra qadwaitadecorations-qt{5,6} qt{5,6}-qtwayland

    - + \ No newline at end of file diff --git a/docs/installation.html b/docs/installation.html index d6797b7f..2c524876 100644 --- a/docs/installation.html +++ b/docs/installation.html @@ -4,14 +4,14 @@ Installation | Buzz - +

    Installation

    To install Buzz, download the latest version for your operating system. Buzz is available on Mac (Intel and Apple silicon), Windows, and Linux.

    macOS

    Download the .dmg from the SourceForge.

    Windows

    Get the installation files from the SourceForge.

    App is not signed, you will get a warning when you install it. Select More info -> Run anyway.

    Linux

    Buzz is available as a Flatpak or a Snap.

    To install flatpak, run:

    flatpak install flathub io.github.chidiwilliams.Buzz

    Download on Flathub

    To install snap, run:

    sudo apt-get install libportaudio2 libcanberra-gtk-module libcanberra-gtk3-module
    sudo snap install buzz
    sudo snap connect buzz:password-manager-service

    Get it from the Snap Store

    PyPI

    pip install buzz-captions
    python -m buzz

    On Linux install system dependencies you may be missing

    sudo apt-get install --no-install-recommends libyaml-dev libtbb-dev libxkbcommon-x11-0 libxcb-icccm4 libxcb-image0 libxcb-keysyms1 libxcb-randr0 libxcb-render-util0 libxcb-xinerama0 libxcb-shape0 libxcb-cursor0 libportaudio2 gettext libpulse0 ffmpeg

    On versions prior to Ubuntu 24.04 install sudo apt-get install --no-install-recommends libegl1-mesa

    - + \ No newline at end of file diff --git a/docs/preferences.html b/docs/preferences.html index ba2a4279..9d5b23a0 100644 --- a/docs/preferences.html +++ b/docs/preferences.html @@ -4,7 +4,7 @@ Preferences | Buzz - + @@ -23,7 +23,7 @@ larger model. For example q_5 version. Whisper.cpp base models in d Increasing number of threads even more will lead in slower transcription time as results from parallel threads has to be combined to produce the final answer.

    BUZZ_TRANSLATION_API_BASE_URL - Base URL of OpenAI compatible API to use for translation.

    BUZZ_TRANSLATION_API_KEY - Api key of OpenAI compatible API to use for translation.

    BUZZ_MODEL_ROOT - Root directory to store model files. You may also want to set HF_HOME to the same folder as some libraries used in Buzz download their models independently. Defaults to user_cache_dir.

    BUZZ_FAVORITE_LANGUAGES - Comma-separated list of supported language codes to show on top of language list.

    BUZZ_DOWNLOAD_COOKIEFILE - Location of a cookiefile to use for downloading private videos or as workaround for anti-bot protection.

    BUZZ_FORCE_CPU - Will force Buzz to use CPU and not GPU, useful for setups with older GPU if that is slower than CPU or GPU has issues. Example usage BUZZ_FORCE_CPU=true. Available since 1.2.1

    BUZZ_REDUCE_GPU_MEMORY - Will use 8bit quantization for Huggingface and Faster Whisper transcriptions to reduce required GPU memory. Example usage BUZZ_REDUCE_GPU_MEMORY=true. Available since 1.4.0

    BUZZ_MERGE_REGROUP_RULE - Custom regroup merge rule to use when combining transcripts with word-level timings. More information on available options in stable-ts repo. Available since 1.3.0

    BUZZ_DISABLE_TELEMETRY - Buzz collects basic OS name and architecture usage statistics to better focus development efforts. This variable lets you disable collection of these statistics. Example usage BUZZ_DISABLE_TELEMETRY=true. Available since 1.3.0

    BUZZ_UPLOAD_URL - Live recording transcripts and translations can be uploaded to a server for display on the web. Set this variable to the desired upload url. You can use buzz-transcription-server as a server. Buzz will upload the following json via POST requests - {"kind": "transcript", "text": "Sample transcript"} or {"kind": "translation", "text": "Sample translation"}. Example usage BUZZ_UPLOAD_URL=http://localhost:5000/upload. Available since 1.3.0

    Example of data collected by telemetry:

    Buzz: 1.3.0, locale: ('lv_LV', 'UTF-8'), system: Linux, release: 6.14.0-27-generic, machine: x86_64, version: #27~24.04.1-Ubuntu SMP PREEMPT_DYNAMIC Tue Jul 22 17:38:49 UTC 2,

    BUZZ_PARAGRAPH_SPLIT_TIME - Time in milliseconds of silence to split paragraphs in transcript and add two newlines when exporting the transcripts as text. Default is 2000 or 2 seconds. Available since 1.3.0

    - + \ No newline at end of file diff --git a/docs/usage/edit_and_resize.html b/docs/usage/edit_and_resize.html index 0b79e1d0..a93dc9d7 100644 --- a/docs/usage/edit_and_resize.html +++ b/docs/usage/edit_and_resize.html @@ -4,13 +4,13 @@ Edit and Resize | Buzz - +
    -

    Edit and Resize

    Resize options

    When transcript of some audio or video file is generated you can edit it and export to different subtitle formats or plain text. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    Transcription view screen has an option to resize the transcripts. Click on the "Resize" button to see available options. Transcripts that have been generated with word-level timings setting enabled can be combined into subtitles specifying different options, like maximum length of a subtitle and if subtitles should be split on punctuation. Transcripts that have been generated without word-level timings setting enabled can only be recombined specifying desired max length of a subtitle.

    If audio file is still present on the system word-level timing merge will also analyze the audio for silences to improve subtitle accuracy. Subtitle generation from transcripts with word-level timings is available since version 1.3.0.

    The resize tool also has an option to extend end time of segments if you want the subtitles to be on the screen for longer. You can specify the amount of time in seconds to extend each subtitle segment. Buzz will add this amount of time to the end of each subtitle segment making sure that the end of a segment does not go over start of the next segment. This feature is available since 1.4.3.

    - +

    Edit and Resize

    Resize options

    When transcript of some audio or video file is generated you can edit it and export to different subtitle formats or plain text. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    Transcription view screen has an option to resize the transcripts. Click on the "Resize" button to see available options. Transcripts that have been generated with word-level timings setting enabled can be combined into subtitles specifying different options, like maximum length of a subtitle and if subtitles should be split on punctuation. Transcripts that have been generated without word-level timings setting enabled can only be recombined specifying desired max length of a subtitle.

    If audio file is still present on the system word-level timing merge will also analyze the audio for silences to improve subtitle accuracy.

    The resize tool also has an option to extend end time of segments if you want the subtitles to be on the screen for longer. You can specify the amount of time in seconds to extend each subtitle segment. Buzz will add this amount of time to the end of each subtitle segment making sure that the end of a segment does not go over start of the next segment. This feature is available since 1.4.3.

    + \ No newline at end of file diff --git a/docs/usage/file_import.html b/docs/usage/file_import.html index 60af79e5..65b3860f 100644 --- a/docs/usage/file_import.html +++ b/docs/usage/file_import.html @@ -4,14 +4,14 @@ File Import | Buzz - +

    File Import

    To import a file:

    • Click Import Media File on the File menu (or the '+' icon on the toolbar, or Command/Ctrl + O).
    • Choose an audio or video file.
    • Select a task, language, and the model settings.
    • Click Run.
    • When the transcription status shows 'Completed', double-click on the row (or select the row and click the '⤢' icon) to -open the transcription.

    Available options:

    To reduce misspellings you can pass some commonly misspelled words in an Initial prompt that is available under Advanced... button. See this guide on prompting.

    FieldOptionsDefaultDescription
    Export As"TXT", "SRT", "VTT""TXT"Export file format
    Word-Level TimingsOff / OnOffIf checked, the transcription will generate a separate subtitle line for each word in the audio. Combine words into subtitles afterwards with the resize option.
    Extract speechOff / OnOffIf checked, speech will be extracted to a separate audio track to improve accuracy. Available since 1.3.0.

    (See the Live Recording section for more information about the task, language, and quality settings.)

    Media File Import on Buzz

    💡 Tip: It is recommended to always select language to transcribe to as automatic language detection may result in unexpected results.

    - +open the transcription.

    Available options:

    To reduce misspellings you can pass some commonly misspelled words in an Initial prompt that is available under Advanced... button. See this guide on prompting.

    FieldOptionsDefaultDescription
    Export As"TXT", "SRT", "VTT""TXT"Export file format
    Word-Level TimingsOff / OnOffIf checked, the transcription will generate a separate subtitle line for each word in the audio. Combine words into subtitles afterwards with the resize option.
    Extract speechOff / OnOffIf checked, speech will be extracted to a separate audio track to improve accuracy.

    (See the Live Recording section for more information about the task, language, and quality settings.)

    Media File Import on Buzz

    💡 Tip: It is recommended to always select language to transcribe to as automatic language detection may result in unexpected results.

    + \ No newline at end of file diff --git a/docs/usage/live_recording.html b/docs/usage/live_recording.html index cb212dc9..01a3b2fb 100644 --- a/docs/usage/live_recording.html +++ b/docs/usage/live_recording.html @@ -4,21 +4,20 @@ Live Recording | Buzz - +

    Live Recording

    To start a live recording:

    • Select a recording task, language, quality, and microphone.
    • Click Record.

    Note: Transcribing audio using the default Whisper model is resource-intensive. Consider using the Whisper.cpp. -It supports GPU acceleration, if the model fits in GPU memory. Use smaller models for real-time performance.

    FieldOptionsDefaultDescription
    Task"Transcribe", "Translate to English""Transcribe""Transcribe" converts the input audio into text in the selected language, while "Translate to English" converts it into text in English.
    LanguageSee Whisper's documentation for the full list of supported languages"Detect Language""Detect Language" will try to detect the spoken language in the audio based on the first few seconds. However, selecting a language is recommended (if known) as it will improve transcription quality in many cases.
    Microphone[Available system microphones][Default system microphone]Microphone for recording input audio.

    Live Recording on Buzz

    Advanced preferences

    Silence threshold Set the threshold for transcriptions to be processed. If average volume level is under this setting the sentence will not be transcribed. Available since 1.4.4. -Line separator Marking to add to the transcription and translation lines. Default value is two new lines (\n\n) that result in an empty space between translation or transcription lines. To have no empty line use \n. Available since 1.4.4.

    Presentation Window

    Since 1.4.2 Buzz has an easy to use presentation window you can use to show live transcriptions during events and presentations. To open it start the recording and new options for the Presentation window will appear.

    Record audio playing from computer (macOS)

    To record audio playing from an application on your computer, you may install an audio loopback driver (a program that +It supports GPU acceleration, if the model fits in GPU memory. Use smaller models for real-time performance.

    FieldOptionsDefaultDescription
    Task"Transcribe", "Translate to English""Transcribe""Transcribe" converts the input audio into text in the selected language, while "Translate to English" converts it into text in English.
    LanguageSee Whisper's documentation for the full list of supported languages"Detect Language""Detect Language" will try to detect the spoken language in the audio based on the first few seconds. However, selecting a language is recommended (if known) as it will improve transcription quality in many cases.
    Microphone[Available system microphones][Default system microphone]Microphone for recording input audio.

    Live Recording on Buzz

    Advanced preferences

    Silence threshold Set the threshold for transcriptions to be processed. If average volume level is under this setting the sentence will not be transcribed. Available since 1.4.4.

    Line separator Marking to add to the transcription and translation lines. Default value is two new lines (\n\n) that result in an empty space between translation or transcription lines. To have no empty line use \n. Available since 1.4.4.

    Transcription step If live recording mode is set to Append and correct, you can also set a transcription step. Shorter steps will reduce latency but cause larger load on the system. Monitor the Queue while transcribing in this mode, if it grows too much, increase the transcription step, to reduce load. Available since 1.4.4.

    Hide unconfirmed If live recording mode is set to Append and correct, you can also hide the unconfirmed part of the last transcript. This part may be incorrect as Buzz has seen it only in one overlapping transcription segment. Hiding it will increase latency, but result will show only the correct transcripts. Available since 1.4.4.

    Presentation Window

    Buzz has an easy to use presentation window you can use to show live transcriptions during events and presentations. To open it start the recording and new options for the Presentation window will appear.

    Record audio playing from computer (macOS)

    To record audio playing from an application on your computer, you may install an audio loopback driver (a program that lets you create virtual audio devices). The rest of this guide will use BlackHole on Mac, but you can use other alternatives for your operating system ( see LoopBeAudio, LoopBack, and Virtual Audio Cable).

    1. Install BlackHole via Homebrew

      brew install blackhole-2ch
    2. Open Audio MIDI Setup from Spotlight or from /Applications/Utilities/Audio Midi Setup.app.

      Open Audio MIDI Setup from Spotlight

    3. Click the '+' icon at the lower left corner and select 'Create Multi-Output Device'.

      Create multi-output device

    4. Add your default speaker and BlackHole to the multi-output device.

      Screenshot of multi-output device

    5. Select this multi-output device as your speaker (application or system-wide) to play audio into BlackHole.

    6. Open Buzz, select BlackHole as your microphone, and record as before to see transcriptions from the audio playing through BlackHole.

    Record audio playing from computer (Windows)

    To transcribe system audio you need to configure virtual audio device and connect output from the applications you want to transcribe to this virtual speaker. After that you can select it as source in Buzz.

    1. Install VB CABLE as virtual audio device.

    2. Configure using Windows Sound settings. Right-click on the speaker icon in the system tray and select "Open Sound settings". In the "Choose your output device" dropdown select "CABLE Input" to send all system sound to the virtual device or use "Advanced sound options" to select application that will output their sound to this device.

    Record audio playing from computer (Linux)

    As described on Ubuntu Wiki on any Linux with pulse audio you can redirect application audio to a virtual speaker. After that you can select it as source in Buzz.

    Overall steps:

    1. Launch application that will produce the sound you want to transcribe and start the playback. For example start a video in a media player.
    2. Launch Buzz and open Live recording screen, so you see the settings.
    3. Configure sound routing from the application you want to transcribe sound from to Buzz in Recording tab of the PulseAudio Volume Control (pavucontrol).
    - + \ No newline at end of file diff --git a/docs/usage/speaker_identification.html b/docs/usage/speaker_identification.html index d258b122..555a659e 100644 --- a/docs/usage/speaker_identification.html +++ b/docs/usage/speaker_identification.html @@ -4,13 +4,13 @@ Speaker identification | Buzz - +
    -

    Speaker identification

    When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    Transcription view screen has option to identify speakers. Click on the "Identify speakers" button to see available options.

    If audio file is still present on the system speaker identification will mark each speaker's sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speaker's real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is available since version 1.4.0 on all platforms except Intel macOS.

    - +

    Speaker identification

    When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    Transcription view screen has option to identify speakers. Click on the "Identify speakers" button to see available options.

    If audio file is still present on the system speaker identification will mark each speaker's sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speaker's real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is not available on Intel macOS.

    + \ No newline at end of file diff --git a/docs/usage/transcription_viewer.html b/docs/usage/transcription_viewer.html index 4a8bf4da..395de6c3 100644 --- a/docs/usage/transcription_viewer.html +++ b/docs/usage/transcription_viewer.html @@ -4,13 +4,13 @@ Transcription Viewer | Buzz - +
    -

    Transcription Viewer

    The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.

    Overview

    The transcription viewer is organized into several key sections:

    • Top Toolbar: Contains view mode, export, translate, resize, and search
    • Search Bar: Find and navigate through transcript text
    • Transcription Segments: Table view of all transcription segments with timestamps
    • Playback Controls: Audio playback settings and speed controls (since version 1.3.0)
    • Audio Player: Standard media player with progress bar
    • Current Segment Display: Shows the currently selected or playing segment

    Top Toolbar

    View Mode Button

    • Function: Switch between different viewing modes
    • Options:
      • Timestamps: Shows segments in a table format with start/end times
      • Text: Shows combined text without timestamps
      • Translation: Shows translated text (if available)

    Export Button

    • Function: Export transcription in various formats
    • Formats: SRT, VTT, TXT, JSON, and more
    • Usage: Click to open export menu and select desired format

    Translate Button

    • Function: Translate transcription to different languages
    • Usage: Click to open translation settings and start translation

    Resize Button

    • Function: Adjust transcription segment boundaries
    • Usage: Click to open resize dialog for fine-tuning timestamps
    • More information: See Edit and Resize section

    Playback Controls Button

    (since version 1.3.0)

    • Function: Show/hide playback control panel
    • Shortcut: Ctrl+Alt+P (Windows/Linux) or Cmd+Alt+P (macOS)
    • Behavior: Toggle button that shows/hides the playback controls below

    Find Button

    (since version 1.3.0)

    • Function: Show/hide search functionality
    • Shortcut: Ctrl+F (Windows/Linux) or Cmd+F (macOS)
    • Behavior: Toggle button that shows/hides the search bar

    Scroll to Current Button

    (since version 1.3.0)

    • Function: Automatically scroll to the currently playing text
    • Shortcut: Ctrl+G (Windows/Linux) or Cmd+G (macOS)
    • Usage: Click to jump to the current audio position in the transcript

    Search Functionality

    (since version 1.3.0)

    The search bar appears below the toolbar when activated and provides:

    • Search Input: Type text to find in the transcription (wider input field for better usability)
    • Navigation: Up/down arrows to move between matches
    • Status: Shows current match position and total matches (e.g., "3 of 15 matches")
    • Clear: Remove search text and results (larger button for better accessibility)
    • Results: Displays found text with context
    • Consistent Button Sizing: All navigation buttons have uniform height for better visual consistency

    Search Shortcuts

    • Ctrl+F / Cmd+F: Toggle search bar on/off
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar

    Search Features

    • Real-time Search: Results update as you type
    • Case-insensitive: Finds matches regardless of capitalization
    • Word Boundaries: Respects word boundaries for accurate matching
    • Cross-view Search: Works in all view modes (Timestamps, Text, Translation)

    Playback Controls

    (since version 1.3.0)

    Loop Segment

    • Function: Automatically loop playback of selected segments
    • Usage: Check the "Loop Segment" checkbox
    • Behavior: When enabled, clicking on a transcript segment will set a loop range
    • Visual Feedback: Loop range is highlighted in the audio player

    Follow Audio

    • Function: Automatically scroll to current audio position
    • Usage: Check the "Follow Audio" checkbox
    • Behavior: Transcript automatically follows the audio playback
    • Benefits: Easy to follow along with long audio files

    Speed Controls

    • Function: Adjust audio playback speed
    • Range: 0.5x to 2.0x speed
    • Controls:
      • Speed Dropdown: Select from preset speeds or enter custom value
      • Decrease Button (-): Reduce speed by 0.05x increments
      • Increase Button (+): Increase speed by 0.05x increments
    • Persistence: Speed setting is saved between sessions
    • Button Sizing: Speed control buttons match the size of search navigation buttons for visual consistency

    Keyboard Shortcuts

    (since version 1.3.0)

    Audio Playback

    • Ctrl+P / Cmd+P: Play/Pause audio
    • Ctrl+Shift+P / Cmd+Shift+P: Replay current segment from start

    Timestamp Adjustment

    • Ctrl+← / Cmd+←: Decrease segment start time by 0.5s
    • Ctrl+→ / Cmd+→: Increase segment start time by 0.5s
    • Ctrl+Shift+← / Cmd+Shift+←: Decrease segment end time by 0.5s
    • Ctrl+Shift+→ / Cmd+Shift+→: Increase segment end time by 0.5s
    • Ctrl+F / Cmd+F: Toggle search bar
    • Ctrl+Alt+P / Cmd+Alt+P: Toggle playback controls
    • Ctrl+G / Cmd+G: Scroll to current position
    • Ctrl+O / Cmd+O: Open file import dialog
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar
    - +

    Transcription Viewer

    The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.

    Overview

    The transcription viewer is organized into several key sections:

    • Top Toolbar: Contains view mode, export, translate, resize, and search
    • Search Bar: Find and navigate through transcript text
    • Transcription Segments: Table view of all transcription segments with timestamps
    • Playback Controls: Audio playback settings and speed controls
    • Audio Player: Standard media player with progress bar
    • Current Segment Display: Shows the currently selected or playing segment

    Top Toolbar

    View Mode Button

    • Function: Switch between different viewing modes
    • Options:
      • Timestamps: Shows segments in a table format with start/end times
      • Text: Shows combined text without timestamps
      • Translation: Shows translated text (if available)

    Export Button

    • Function: Export transcription in various formats
    • Formats: SRT, VTT, TXT, JSON, and more
    • Usage: Click to open export menu and select desired format

    Translate Button

    • Function: Translate transcription to different languages
    • Usage: Click to open translation settings and start translation

    Resize Button

    • Function: Adjust transcription segment boundaries
    • Usage: Click to open resize dialog for fine-tuning timestamps
    • More information: See Edit and Resize section

    Playback Controls Button

    • Function: Show/hide playback control panel
    • Shortcut: Ctrl+Alt+P (Windows/Linux) or Cmd+Alt+P (macOS)
    • Behavior: Toggle button that shows/hides the playback controls below

    Find Button

    • Function: Show/hide search functionality
    • Shortcut: Ctrl+F (Windows/Linux) or Cmd+F (macOS)
    • Behavior: Toggle button that shows/hides the search bar

    Scroll to Current Button

    • Function: Automatically scroll to the currently playing text
    • Shortcut: Ctrl+G (Windows/Linux) or Cmd+G (macOS)
    • Usage: Click to jump to the current audio position in the transcript

    Search Functionality

    The search bar appears below the toolbar when activated and provides:

    • Search Input: Type text to find in the transcription (wider input field for better usability)
    • Navigation: Up/down arrows to move between matches
    • Status: Shows current match position and total matches (e.g., "3 of 15 matches")
    • Clear: Remove search text and results (larger button for better accessibility)
    • Results: Displays found text with context
    • Consistent Button Sizing: All navigation buttons have uniform height for better visual consistency

    Search Shortcuts

    • Ctrl+F / Cmd+F: Toggle search bar on/off
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar

    Search Features

    • Real-time Search: Results update as you type
    • Case-insensitive: Finds matches regardless of capitalization
    • Word Boundaries: Respects word boundaries for accurate matching
    • Cross-view Search: Works in all view modes (Timestamps, Text, Translation)

    Playback Controls

    Loop Segment

    • Function: Automatically loop playback of selected segments
    • Usage: Check the "Loop Segment" checkbox
    • Behavior: When enabled, clicking on a transcript segment will set a loop range
    • Visual Feedback: Loop range is highlighted in the audio player

    Follow Audio

    • Function: Automatically scroll to current audio position
    • Usage: Check the "Follow Audio" checkbox
    • Behavior: Transcript automatically follows the audio playback
    • Benefits: Easy to follow along with long audio files

    Speed Controls

    • Function: Adjust audio playback speed
    • Range: 0.5x to 2.0x speed
    • Controls:
      • Speed Dropdown: Select from preset speeds or enter custom value
      • Decrease Button (-): Reduce speed by 0.05x increments
      • Increase Button (+): Increase speed by 0.05x increments
    • Persistence: Speed setting is saved between sessions
    • Button Sizing: Speed control buttons match the size of search navigation buttons for visual consistency

    Keyboard Shortcuts

    Audio Playback

    • Ctrl+P / Cmd+P: Play/Pause audio
    • Ctrl+Shift+P / Cmd+Shift+P: Replay current segment from start

    Timestamp Adjustment

    • Ctrl+← / Cmd+←: Decrease segment start time by 0.5s
    • Ctrl+→ / Cmd+→: Increase segment start time by 0.5s
    • Ctrl+Shift+← / Cmd+Shift+←: Decrease segment end time by 0.5s
    • Ctrl+Shift+→ / Cmd+Shift+→: Increase segment end time by 0.5s
    • Ctrl+F / Cmd+F: Toggle search bar
    • Ctrl+Alt+P / Cmd+Alt+P: Toggle playback controls
    • Ctrl+G / Cmd+G: Scroll to current position
    • Ctrl+O / Cmd+O: Open file import dialog
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar
    + \ No newline at end of file diff --git a/docs/usage/translations.html b/docs/usage/translations.html index ff42b8ef..37062510 100644 --- a/docs/usage/translations.html +++ b/docs/usage/translations.html @@ -3,14 +3,14 @@ -Translations | Buzz - +Translations | Buzz +
    -

    Translations

    Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Since version 1.0.0 Buzz supports additional AI translations to any other language.

    To use translation feature you will need to configure OpenAI API key and translation settings. Set OpenAI API key in Preferences. Buzz also supports custom locally running translation AIs that support OpenAI API. For more information on locally running AIs see ollama or LM Studio. For information on available custom APIs see this discussion thread.

    To configure translation for Live recordings enable it in Advanced settings dialog of the Live Recording settings. Enter AI model to use and prompt with instructions for the AI on how to translate. Translation option is also available for files that already have speech recognised. Use Translate button on transcription viewer toolbar.

    For AI to know how to translate enter translation instructions in the "Instructions for AI" section. In your instructions you should describe to what language you want it to translate the text to. Also, you may need to add additional instructions to not add any notes or comments as AIs tend to add them. Example instructions to translate English subtitles to Spanish:

    You are a professional translator, skilled in translating English to Spanish. You will only translate each sentence sent to you into Spanish and not add any notes or comments.

    If you enable "Enable live recording transcription export" in Preferences, Live text transcripts will be exported to a text file as they get generated and translated. This file can be used to further integrate Live transcripts with other applications like OBS Studio.

    Approximate cost of translation for 1 hour long audio with ChatGPT gpt-4o model is around $0.50.

    - +

    Translations

    Default Translation task uses Whisper model ability to translate to English, however Large-V3-Turbo is not compatible with this standard. Buzz supports additional AI translations to any other language.

    To use translation feature you will need to configure OpenAI API key and translation settings. Set OpenAI API key in Preferences. Buzz also supports custom locally running translation AIs that support OpenAI API. For more information on locally running AIs see ollama or LM Studio. For information on available custom APIs see this discussion thread.

    To configure translation for Live recordings enable it in Advanced settings dialog of the Live Recording settings. Enter AI model to use and prompt with instructions for the AI on how to translate. Translation option is also available for files that already have speech recognised. Use Translate button on transcription viewer toolbar.

    For AI to know how to translate enter translation instructions in the "Instructions for AI" section. In your instructions you should describe to what language you want it to translate the text to. Also, you may need to add additional instructions to not add any notes or comments as AIs tend to add them. Example instructions to translate English subtitles to Spanish:

    You are a professional translator, skilled in translating English to Spanish. You will only translate each sentence sent to you into Spanish and not add any notes or comments.

    If you enable "Enable live recording transcription export" in Preferences, Live text transcripts will be exported to a text file as they get generated and translated. This file can be used to further integrate Live transcripts with other applications like OBS Studio.

    Approximate cost of translation for 1 hour long audio with ChatGPT gpt-4o model is around $0.50.

    + \ No newline at end of file diff --git a/index.html b/index.html index 46467409..9ffa4786 100644 --- a/index.html +++ b/index.html @@ -4,13 +4,13 @@ Buzz - +
    - + \ No newline at end of file diff --git a/zh/404.html b/zh/404.html index 9392a2c6..7d9753bc 100644 --- a/zh/404.html +++ b/zh/404.html @@ -4,13 +4,13 @@ 找不到页面 | Buzz - +

    找不到页面

    我们找不到您要找的页面。

    请联系原始链接来源网站的所有者,并告知他们链接已损坏。

    - + \ No newline at end of file diff --git a/zh/assets/js/6ec58200.3dde5236.js b/zh/assets/js/6ec58200.d9b4199b.js similarity index 84% rename from zh/assets/js/6ec58200.3dde5236.js rename to zh/assets/js/6ec58200.d9b4199b.js index 16d7ba48..55960e89 100644 --- a/zh/assets/js/6ec58200.3dde5236.js +++ b/zh/assets/js/6ec58200.d9b4199b.js @@ -1 +1 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[150],{3905:(e,t,n)=>{n.d(t,{Zo:()=>l,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function a(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function o(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var c=r.createContext({}),p=function(e){var t=r.useContext(c),n=t;return e&&(n="function"==typeof e?e(t):o(o({},t),e)),n},l=function(e){var t=p(e.components);return r.createElement(c.Provider,{value:t},e.children)},u="mdxType",f={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},d=r.forwardRef((function(e,t){var n=e.components,i=e.mdxType,a=e.originalType,c=e.parentName,l=s(e,["components","mdxType","originalType","parentName"]),u=p(n),d=i,m=u["".concat(c,".").concat(d)]||u[d]||f[d]||a;return n?r.createElement(m,o(o({ref:t},l),{},{components:n})):r.createElement(m,o({ref:t},l))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var a=n.length,o=new Array(a);o[0]=d;var s={};for(var c in t)hasOwnProperty.call(t,c)&&(s[c]=t[c]);s.originalType=e,s[u]="string"==typeof e?e:i,o[1]=s;for(var 
p=2;p{n.r(t),n.d(t,{assets:()=>c,contentTitle:()=>o,default:()=>f,frontMatter:()=>a,metadata:()=>s,toc:()=>p});var r=n(7462),i=(n(7294),n(3905));const a={title:"Speaker identification"},o=void 0,s={unversionedId:"usage/speaker_identification",id:"usage/speaker_identification",title:"Speaker identification",description:"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.",source:"@site/docs/usage/5_speaker_identification.md",sourceDirName:"usage",slug:"/usage/speaker_identification",permalink:"/buzz/zh/docs/usage/speaker_identification",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{title:"Speaker identification"},sidebar:"tutorialSidebar",previous:{title:"\u7f16\u8f91\u4e0e\u8c03\u6574",permalink:"/buzz/zh/docs/usage/edit_and_resize"},next:{title:"Transcription Viewer",permalink:"/buzz/zh/docs/usage/transcription_viewer"}},c={},p=[],l={toc:p},u="wrapper";function f(e){let{components:t,...n}=e;return(0,i.kt)(u,(0,r.Z)({},l,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to identify speakers. Click on the "Identify speakers" button so see available options. '),(0,i.kt)("p",null,'If audio file is still present on the system speaker identification will mark each speakers sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speakers real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. 
Speaker identification is available since version 1.4.0 on all platforms except Intel macOS.'))}f.isMDXComponent=!0}}]); \ No newline at end of file +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[150],{3905:(e,t,n)=>{n.d(t,{Zo:()=>l,kt:()=>m});var r=n(7294);function i(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function a(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var r=Object.getOwnPropertySymbols(e);t&&(r=r.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,r)}return n}function o(e){for(var t=1;t=0||(i[n]=e[n]);return i}(e,t);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);for(r=0;r=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(i[n]=e[n])}return i}var c=r.createContext({}),p=function(e){var t=r.useContext(c),n=t;return e&&(n="function"==typeof e?e(t):o(o({},t),e)),n},l=function(e){var t=p(e.components);return r.createElement(c.Provider,{value:t},e.children)},u="mdxType",d={inlineCode:"code",wrapper:function(e){var t=e.children;return r.createElement(r.Fragment,{},t)}},f=r.forwardRef((function(e,t){var n=e.components,i=e.mdxType,a=e.originalType,c=e.parentName,l=s(e,["components","mdxType","originalType","parentName"]),u=p(n),f=i,m=u["".concat(c,".").concat(f)]||u[f]||d[f]||a;return n?r.createElement(m,o(o({ref:t},l),{},{components:n})):r.createElement(m,o({ref:t},l))}));function m(e,t){var n=arguments,i=t&&t.mdxType;if("string"==typeof e||i){var a=n.length,o=new Array(a);o[0]=f;var s={};for(var c in t)hasOwnProperty.call(t,c)&&(s[c]=t[c]);s.originalType=e,s[u]="string"==typeof e?e:i,o[1]=s;for(var p=2;p{n.r(t),n.d(t,{assets:()=>c,contentTitle:()=>o,default:()=>d,frontMatter:()=>a,metadata:()=>s,toc:()=>p});var r=n(7462),i=(n(7294),n(3905));const a={title:"Speaker identification"},o=void 0,s={unversionedId:"usage/speaker_identification",id:"usage/speaker_identification",title:"Speaker 
identification",description:"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.",source:"@site/docs/usage/5_speaker_identification.md",sourceDirName:"usage",slug:"/usage/speaker_identification",permalink:"/buzz/zh/docs/usage/speaker_identification",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{title:"Speaker identification"},sidebar:"tutorialSidebar",previous:{title:"\u7f16\u8f91\u4e0e\u8c03\u6574",permalink:"/buzz/zh/docs/usage/edit_and_resize"},next:{title:"Transcription Viewer",permalink:"/buzz/zh/docs/usage/transcription_viewer"}},c={},p=[],l={toc:p},u="wrapper";function d(e){let{components:t,...n}=e;return(0,i.kt)(u,(0,r.Z)({},l,n,{components:t,mdxType:"MDXLayout"}),(0,i.kt)("p",null,"When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting."),(0,i.kt)("p",null,'Transcription view screen has option to identify speakers. Click on the "Identify speakers" button so see available options. '),(0,i.kt)("p",null,'If audio file is still present on the system speaker identification will mark each speakers sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speakers real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. 
Speaker identification is not available on Intel macOS.'))}d.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/zh/assets/js/dbcee777.062349f5.js b/zh/assets/js/dbcee777.062349f5.js new file mode 100644 index 00000000..621b8944 --- /dev/null +++ b/zh/assets/js/dbcee777.062349f5.js @@ -0,0 +1 @@ +"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[598],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>d});var a=n(7294);function r(e,t,n){return t in e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function l(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var i=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var s=a.createContext({}),p=function(e){var t=a.useContext(s),n=t;return e&&(n="function"==typeof e?e(t):l(l({},t),e)),n},u=function(e){var t=p(e.components);return a.createElement(s.Provider,{value:t},e.children)},m="mdxType",c={inlineCode:"code",wrapper:function(e){var t=e.children;return a.createElement(a.Fragment,{},t)}},k=a.forwardRef((function(e,t){var n=e.components,r=e.mdxType,i=e.originalType,s=e.parentName,u=o(e,["components","mdxType","originalType","parentName"]),m=p(n),k=r,d=m["".concat(s,".").concat(k)]||m[k]||c[k]||i;return n?a.createElement(d,l(l({ref:t},u),{},{components:n})):a.createElement(d,l({ref:t},u))}));function d(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var i=n.length,l=new Array(i);l[0]=k;var o={};for(var s in t)hasOwnProperty.call(t,s)&&(o[s]=t[s]);o.originalType=e,o[m]="string"==typeof e?e:r,l[1]=o;for(var p=2;p{n.r(t),n.d(t,{assets:()=>s,contentTitle:()=>l,default:()=>c,frontMatter:()=>i,metadata:()=>o,toc:()=>p});var 
a=n(7462),r=(n(7294),n(3905));const i={},l="Transcription Viewer",o={unversionedId:"usage/transcription_viewer",id:"usage/transcription_viewer",title:"Transcription Viewer",description:"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.",source:"@site/docs/usage/5_transcription_viewer.md",sourceDirName:"usage",slug:"/usage/transcription_viewer",permalink:"/buzz/zh/docs/usage/transcription_viewer",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{},sidebar:"tutorialSidebar",previous:{title:"Speaker identification",permalink:"/buzz/zh/docs/usage/speaker_identification"},next:{title:"\u504f\u597d\u8bbe\u7f6e",permalink:"/buzz/zh/docs/preferences"}},s={},p=[{value:"Overview",id:"overview",level:2},{value:"Top Toolbar",id:"top-toolbar",level:2},{value:"View Mode Button",id:"view-mode-button",level:3},{value:"Export Button",id:"export-button",level:3},{value:"Translate Button",id:"translate-button",level:3},{value:"Resize Button",id:"resize-button",level:3},{value:"Playback Controls Button",id:"playback-controls-button",level:3},{value:"Find Button",id:"find-button",level:3},{value:"Scroll to Current Button",id:"scroll-to-current-button",level:3},{value:"Search Functionality",id:"search-functionality",level:2},{value:"Search Bar",id:"search-bar",level:3},{value:"Search Shortcuts",id:"search-shortcuts",level:3},{value:"Search Features",id:"search-features",level:3},{value:"Playback Controls",id:"playback-controls",level:2},{value:"Loop Segment",id:"loop-segment",level:3},{value:"Follow Audio",id:"follow-audio",level:3},{value:"Speed Controls",id:"speed-controls",level:3},{value:"Keyboard Shortcuts",id:"keyboard-shortcuts",level:2},{value:"Audio Playback",id:"audio-playback",level:3},{value:"Timestamp 
Adjustment",id:"timestamp-adjustment",level:3},{value:"Navigation",id:"navigation",level:3},{value:"Search",id:"search",level:3}],u={toc:p},m="wrapper";function c(e){let{components:t,...n}=e;return(0,r.kt)(m,(0,a.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("h1",{id:"transcription-viewer"},"Transcription Viewer"),(0,r.kt)("p",null,"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer."),(0,r.kt)("h2",{id:"overview"},"Overview"),(0,r.kt)("p",null,"The transcription viewer is organized into several key sections:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Top Toolbar"),": Contains view mode, export, translate, resize, and search"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Bar"),": Find and navigate through transcript text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Transcription Segments"),": Table view of all transcription segments with timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Playback Controls"),": Audio playback settings and speed controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Audio Player"),": Standard media player with progress bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Current Segment Display"),": Shows the currently selected or playing segment")),(0,r.kt)("h2",{id:"top-toolbar"},"Top Toolbar"),(0,r.kt)("h3",{id:"view-mode-button"},"View Mode Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Switch between different viewing modes"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Options"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Timestamps"),": Shows 
segments in a table format with start/end times"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Text"),": Shows combined text without timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Translation"),": Shows translated text (if available)")))),(0,r.kt)("h3",{id:"export-button"},"Export Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Export transcription in various formats"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Formats"),": SRT, VTT, TXT, JSON, and more"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open export menu and select desired format")),(0,r.kt)("h3",{id:"translate-button"},"Translate Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Translate transcription to different languages"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open translation settings and start translation")),(0,r.kt)("h3",{id:"resize-button"},"Resize Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust transcription segment boundaries"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open resize dialog for fine-tuning timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"More information"),": See ",(0,r.kt)("a",{parentName:"li",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"Edit and Resize")," section")),(0,r.kt)("h3",{id:"playback-controls-button"},"Playback Controls Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide playback control panel"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": 
",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+Alt+P")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+Alt+P")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the playback controls below")),(0,r.kt)("h3",{id:"find-button"},"Find Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide search functionality"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+F")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+F")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the search bar")),(0,r.kt)("h3",{id:"scroll-to-current-button"},"Scroll to Current Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to the currently playing text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+G")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+G")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to jump to the current audio position in the transcript")),(0,r.kt)("h2",{id:"search-functionality"},"Search Functionality"),(0,r.kt)("h3",{id:"search-bar"},"Search Bar"),(0,r.kt)("p",null,"The search bar appears below the toolbar when activated and provides:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Input"),": Type text to find in the transcription (wider input field for better usability)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Navigation"),": Up/down arrows to move between 
matches"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Status"),': Shows current match position and total matches (e.g., "3 of 15 matches")'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Clear"),": Remove search text and results (larger button for better accessibility)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Results"),": Displays found text with context"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Consistent Button Sizing"),": All navigation buttons have uniform height for better visual consistency")),(0,r.kt)("h3",{id:"search-shortcuts"},"Search Shortcuts"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar on/off"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")),(0,r.kt)("h3",{id:"search-features"},"Search Features"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Real-time Search"),": Results update as you type"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Case-insensitive"),": Finds matches regardless of capitalization"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Word Boundaries"),": Respects word boundaries for accurate matching"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Cross-view Search"),": Works in all view modes (Timestamps, Text, 
Translation)")),(0,r.kt)("h2",{id:"playback-controls"},"Playback Controls"),(0,r.kt)("h3",{id:"loop-segment"},"Loop Segment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically loop playback of selected segments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Loop Segment" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": When enabled, clicking on a transcript segment will set a loop range"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Visual Feedback"),": Loop range is highlighted in the audio player")),(0,r.kt)("h3",{id:"follow-audio"},"Follow Audio"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to current audio position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Follow Audio" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Transcript automatically follows the audio playback"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Benefits"),": Easy to follow along with long audio files")),(0,r.kt)("h3",{id:"speed-controls"},"Speed Controls"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust audio playback speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Range"),": 0.5x to 2.0x speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Controls"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Speed Dropdown"),": Select from preset speeds or enter custom value"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Decrease Button (-)"),": Reduce speed by 0.05x 
increments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Increase Button (+)"),": Increase speed by 0.05x increments"))),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Persistence"),": Speed setting is saved between sessions"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Button Sizing"),": Speed control buttons match the size of search navigation buttons for visual consistency")),(0,r.kt)("h2",{id:"keyboard-shortcuts"},"Keyboard Shortcuts"),(0,r.kt)("h3",{id:"audio-playback"},"Audio Playback"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+P")),": Play/Pause audio"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+P")),": Replay current segment from start")),(0,r.kt)("h3",{id:"timestamp-adjustment"},"Timestamp Adjustment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2190")),": Decrease segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2192")),": Increase segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2190")),": Decrease segment end time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2192")," / 
",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2192")),": Increase segment end time by 0.5s")),(0,r.kt)("h3",{id:"navigation"},"Navigation"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Alt+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Alt+P")),": Toggle playback controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+G")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+G")),": Scroll to current position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+O")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+O")),": Open file import dialog")),(0,r.kt)("h3",{id:"search"},"Search"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")))}c.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/zh/assets/js/dbcee777.7a7cfd52.js b/zh/assets/js/dbcee777.7a7cfd52.js deleted file mode 100644 index cc02f86f..00000000 --- a/zh/assets/js/dbcee777.7a7cfd52.js +++ /dev/null @@ -1 +0,0 @@ -"use strict";(self.webpackChunkdocs=self.webpackChunkdocs||[]).push([[598],{3905:(e,t,n)=>{n.d(t,{Zo:()=>u,kt:()=>d});var a=n(7294);function r(e,t,n){return t in 
e?Object.defineProperty(e,t,{value:n,enumerable:!0,configurable:!0,writable:!0}):e[t]=n,e}function i(e,t){var n=Object.keys(e);if(Object.getOwnPropertySymbols){var a=Object.getOwnPropertySymbols(e);t&&(a=a.filter((function(t){return Object.getOwnPropertyDescriptor(e,t).enumerable}))),n.push.apply(n,a)}return n}function l(e){for(var t=1;t=0||(r[n]=e[n]);return r}(e,t);if(Object.getOwnPropertySymbols){var i=Object.getOwnPropertySymbols(e);for(a=0;a=0||Object.prototype.propertyIsEnumerable.call(e,n)&&(r[n]=e[n])}return r}var s=a.createContext({}),p=function(e){var t=a.useContext(s),n=t;return e&&(n="function"==typeof e?e(t):l(l({},t),e)),n},u=function(e){var t=p(e.components);return a.createElement(s.Provider,{value:t},e.children)},m="mdxType",c={inlineCode:"code",wrapper:function(e){var t=e.children;return a.createElement(a.Fragment,{},t)}},k=a.forwardRef((function(e,t){var n=e.components,r=e.mdxType,i=e.originalType,s=e.parentName,u=o(e,["components","mdxType","originalType","parentName"]),m=p(n),k=r,d=m["".concat(s,".").concat(k)]||m[k]||c[k]||i;return n?a.createElement(d,l(l({ref:t},u),{},{components:n})):a.createElement(d,l({ref:t},u))}));function d(e,t){var n=arguments,r=t&&t.mdxType;if("string"==typeof e||r){var i=n.length,l=new Array(i);l[0]=k;var o={};for(var s in t)hasOwnProperty.call(t,s)&&(o[s]=t[s]);o.originalType=e,o[m]="string"==typeof e?e:r,l[1]=o;for(var p=2;p{n.r(t),n.d(t,{assets:()=>s,contentTitle:()=>l,default:()=>c,frontMatter:()=>i,metadata:()=>o,toc:()=>p});var a=n(7462),r=(n(7294),n(3905));const i={},l="Transcription Viewer",o={unversionedId:"usage/transcription_viewer",id:"usage/transcription_viewer",title:"Transcription Viewer",description:"The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. 
This guide covers all the features available in the transcription viewer.",source:"@site/docs/usage/5_transcription_viewer.md",sourceDirName:"usage",slug:"/usage/transcription_viewer",permalink:"/buzz/zh/docs/usage/transcription_viewer",draft:!1,tags:[],version:"current",sidebarPosition:5,frontMatter:{},sidebar:"tutorialSidebar",previous:{title:"Speaker identification",permalink:"/buzz/zh/docs/usage/speaker_identification"},next:{title:"\u504f\u597d\u8bbe\u7f6e",permalink:"/buzz/zh/docs/preferences"}},s={},p=[{value:"Overview",id:"overview",level:2},{value:"Top Toolbar",id:"top-toolbar",level:2},{value:"View Mode Button",id:"view-mode-button",level:3},{value:"Export Button",id:"export-button",level:3},{value:"Translate Button",id:"translate-button",level:3},{value:"Resize Button",id:"resize-button",level:3},{value:"Playback Controls Button",id:"playback-controls-button",level:3},{value:"Find Button",id:"find-button",level:3},{value:"Scroll to Current Button",id:"scroll-to-current-button",level:3},{value:"Search Functionality",id:"search-functionality",level:2},{value:"Search Bar",id:"search-bar",level:3},{value:"Search Shortcuts",id:"search-shortcuts",level:3},{value:"Search Features",id:"search-features",level:3},{value:"Playback Controls",id:"playback-controls",level:2},{value:"Loop Segment",id:"loop-segment",level:3},{value:"Follow Audio",id:"follow-audio",level:3},{value:"Speed Controls",id:"speed-controls",level:3},{value:"Keyboard Shortcuts",id:"keyboard-shortcuts",level:2},{value:"Audio Playback",id:"audio-playback",level:3},{value:"Timestamp Adjustment",id:"timestamp-adjustment",level:3},{value:"Navigation",id:"navigation",level:3},{value:"Search",id:"search",level:3}],u={toc:p},m="wrapper";function c(e){let{components:t,...n}=e;return(0,r.kt)(m,(0,a.Z)({},u,n,{components:t,mdxType:"MDXLayout"}),(0,r.kt)("h1",{id:"transcription-viewer"},"Transcription Viewer"),(0,r.kt)("p",null,"The Buzz transcription viewer provides a powerful interface for reviewing, 
editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer."),(0,r.kt)("h2",{id:"overview"},"Overview"),(0,r.kt)("p",null,"The transcription viewer is organized into several key sections:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Top Toolbar"),": Contains view mode, export, translate, resize, and search"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Bar"),": Find and navigate through transcript text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Transcription Segments"),": Table view of all transcription segments with timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Playback Controls"),": Audio playback settings and speed controls (since version 1.3.0)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Audio Player"),": Standard media player with progress bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Current Segment Display"),": Shows the currently selected or playing segment")),(0,r.kt)("h2",{id:"top-toolbar"},"Top Toolbar"),(0,r.kt)("h3",{id:"view-mode-button"},"View Mode Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Switch between different viewing modes"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Options"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Timestamps"),": Shows segments in a table format with start/end times"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Text"),": Shows combined text without timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Translation"),": Shows translated text (if available)")))),(0,r.kt)("h3",{id:"export-button"},"Export 
Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Export transcription in various formats"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Formats"),": SRT, VTT, TXT, JSON, and more"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open export menu and select desired format")),(0,r.kt)("h3",{id:"translate-button"},"Translate Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Translate transcription to different languages"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open translation settings and start translation")),(0,r.kt)("h3",{id:"resize-button"},"Resize Button"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust transcription segment boundaries"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to open resize dialog for fine-tuning timestamps"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"More information"),": See ",(0,r.kt)("a",{parentName:"li",href:"https://chidiwilliams.github.io/buzz/docs/usage/edit_and_resize"},"Edit and Resize")," section")),(0,r.kt)("h3",{id:"playback-controls-button"},"Playback Controls Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide playback control panel"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+Alt+P")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+Alt+P")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the playback controls below")),(0,r.kt)("h3",{id:"find-button"},"Find 
Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Show/hide search functionality"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+F")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+F")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Toggle button that shows/hides the search bar")),(0,r.kt)("h3",{id:"scroll-to-current-button"},"Scroll to Current Button"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to the currently playing text"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Shortcut"),": ",(0,r.kt)("inlineCode",{parentName:"li"},"Ctrl+G")," (Windows/Linux) or ",(0,r.kt)("inlineCode",{parentName:"li"},"Cmd+G")," (macOS)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),": Click to jump to the current audio position in the transcript")),(0,r.kt)("h2",{id:"search-functionality"},"Search Functionality"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"search-bar"},"Search Bar"),(0,r.kt)("p",null,"The search bar appears below the toolbar when activated and provides:"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Search Input"),": Type text to find in the transcription (wider input field for better usability)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Navigation"),": Up/down arrows to move between matches"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Status"),': Shows current match position and total matches (e.g., "3 of 15 matches")'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Clear"),": Remove search text and 
results (larger button for better accessibility)"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Results"),": Displays found text with context"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Consistent Button Sizing"),": All navigation buttons have uniform height for better visual consistency")),(0,r.kt)("h3",{id:"search-shortcuts"},"Search Shortcuts"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar on/off"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")),(0,r.kt)("h3",{id:"search-features"},"Search Features"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Real-time Search"),": Results update as you type"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Case-insensitive"),": Finds matches regardless of capitalization"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Word Boundaries"),": Respects word boundaries for accurate matching"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Cross-view Search"),": Works in all view modes (Timestamps, Text, Translation)")),(0,r.kt)("h2",{id:"playback-controls"},"Playback Controls"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"loop-segment"},"Loop Segment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically loop playback of selected 
segments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Loop Segment" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": When enabled, clicking on a transcript segment will set a loop range"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Visual Feedback"),": Loop range is highlighted in the audio player")),(0,r.kt)("h3",{id:"follow-audio"},"Follow Audio"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Automatically scroll to current audio position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Usage"),': Check the "Follow Audio" checkbox'),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Behavior"),": Transcript automatically follows the audio playback"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Benefits"),": Easy to follow along with long audio files")),(0,r.kt)("h3",{id:"speed-controls"},"Speed Controls"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Function"),": Adjust audio playback speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Range"),": 0.5x to 2.0x speed"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Controls"),":",(0,r.kt)("ul",{parentName:"li"},(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Speed Dropdown"),": Select from preset speeds or enter custom value"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Decrease Button (-)"),": Reduce speed by 0.05x increments"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Increase Button (+)"),": Increase speed by 0.05x increments"))),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Persistence"),": Speed setting is saved between 
sessions"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},"Button Sizing"),": Speed control buttons match the size of search navigation buttons for visual consistency")),(0,r.kt)("h2",{id:"keyboard-shortcuts"},"Keyboard Shortcuts"),(0,r.kt)("p",null,"(since version 1.3.0)"),(0,r.kt)("h3",{id:"audio-playback"},"Audio Playback"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+P")),": Play/Pause audio"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+P")),": Replay current segment from start")),(0,r.kt)("h3",{id:"timestamp-adjustment"},"Timestamp Adjustment"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2190")),": Decrease segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+\u2192")),": Increase segment start time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2190")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2190")),": Decrease segment end time by 0.5s"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Shift+\u2192")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Shift+\u2192")),": Increase segment end time by 
0.5s")),(0,r.kt)("h3",{id:"navigation"},"Navigation"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+F")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+F")),": Toggle search bar"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+Alt+P")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+Alt+P")),": Toggle playback controls"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+G")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+G")),": Scroll to current position"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Ctrl+O")," / ",(0,r.kt)("inlineCode",{parentName:"strong"},"Cmd+O")),": Open file import dialog")),(0,r.kt)("h3",{id:"search"},"Search"),(0,r.kt)("ul",null,(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Enter")),": Find next match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Shift+Enter")),": Find previous match"),(0,r.kt)("li",{parentName:"ul"},(0,r.kt)("strong",{parentName:"li"},(0,r.kt)("inlineCode",{parentName:"strong"},"Escape")),": Close search bar")))}c.isMDXComponent=!0}}]); \ No newline at end of file diff --git a/zh/assets/js/runtime~main.9b45ef3c.js b/zh/assets/js/runtime~main.9b45ef3c.js new file mode 100644 index 00000000..f08998f7 --- /dev/null +++ b/zh/assets/js/runtime~main.9b45ef3c.js @@ -0,0 +1 @@ +(()=>{"use strict";var e,t,r,o,a,n={},d={};function c(e){var t=d[e];if(void 0!==t)return t.exports;var r=d[e]={id:e,loaded:!1,exports:{}};return n[e].call(r.exports,r,r.exports,c),r.loaded=!0,r.exports}c.m=n,c.c=d,e=[],c.O=(t,r,o,a)=>{if(!r){var 
n=1/0;for(u=0;u=a)&&Object.keys(c.O).every((e=>c.O[e](r[f])))?r.splice(f--,1):(d=!1,a0&&e[u-1][2]>a;u--)e[u]=e[u-1];e[u]=[r,o,a]},c.n=e=>{var t=e&&e.__esModule?()=>e.default:()=>e;return c.d(t,{a:t}),t},r=Object.getPrototypeOf?e=>Object.getPrototypeOf(e):e=>e.__proto__,c.t=function(e,o){if(1&o&&(e=this(e)),8&o)return e;if("object"==typeof e&&e){if(4&o&&e.__esModule)return e;if(16&o&&"function"==typeof e.then)return e}var a=Object.create(null);c.r(a);var n={};t=t||[null,r({}),r([]),r(r)];for(var d=2&o&&e;"object"==typeof d&&!~t.indexOf(d);d=r(d))Object.getOwnPropertyNames(d).forEach((t=>n[t]=()=>e[t]));return n.default=()=>e,c.d(a,n),a},c.d=(e,t)=>{for(var r in t)c.o(t,r)&&!c.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},c.f={},c.e=e=>Promise.all(Object.keys(c.f).reduce(((t,r)=>(c.f[r](e,t),t)),[])),c.u=e=>"assets/js/"+({53:"935f2afb",143:"42a922e9",150:"6ec58200",218:"8d0b11da",237:"1df93b7f",255:"dca12369",271:"93f51c74",310:"a6c9f398",514:"1be78505",598:"dbcee777",675:"2962c32e",741:"bde536f8",860:"3e407b54",870:"92d66db1",918:"17896441",958:"6dbc2e00",995:"076ee139"}[e]||e)+"."+{53:"52c36f3c",143:"1e0b6b58",150:"d9b4199b",218:"eb9558d9",237:"71d7b441",255:"4d73fbd0",271:"edefd04a",310:"13ca4f4b",514:"131974b6",598:"062349f5",675:"6182228c",741:"5bb9f476",860:"987a7018",870:"07fedd0a",918:"0aaaf3b3",958:"24fcb0eb",972:"d5cc17b1",995:"b8a84e34"}[e]+".js",c.miniCssF=e=>{},c.g=function(){if("object"==typeof globalThis)return globalThis;try{return this||new Function("return this")()}catch(e){if("object"==typeof window)return window}}(),c.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),o={},a="docs:",c.l=(e,t,r,n)=>{if(o[e])o[e].push(t);else{var d,f;if(void 0!==r)for(var i=document.getElementsByTagName("script"),u=0;u{d.onerror=d.onload=null,clearTimeout(s);var a=o[e];if(delete o[e],d.parentNode&&d.parentNode.removeChild(d),a&&a.forEach((e=>e(r))),t)return t(r)},s=setTimeout(l.bind(null,void 
0,{type:"timeout",target:d}),12e4);d.onerror=l.bind(null,d.onerror),d.onload=l.bind(null,d.onload),f&&document.head.appendChild(d)}},c.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},c.p="/buzz/zh/",c.gca=function(e){return e={17896441:"918","935f2afb":"53","42a922e9":"143","6ec58200":"150","8d0b11da":"218","1df93b7f":"237",dca12369:"255","93f51c74":"271",a6c9f398:"310","1be78505":"514",dbcee777:"598","2962c32e":"675",bde536f8:"741","3e407b54":"860","92d66db1":"870","6dbc2e00":"958","076ee139":"995"}[e]||e,c.p+c.u(e)},(()=>{var e={303:0,532:0};c.f.j=(t,r)=>{var o=c.o(e,t)?e[t]:void 0;if(0!==o)if(o)r.push(o[2]);else if(/^(303|532)$/.test(t))e[t]=0;else{var a=new Promise(((r,a)=>o=e[t]=[r,a]));r.push(o[2]=a);var n=c.p+c.u(t),d=new Error;c.l(n,(r=>{if(c.o(e,t)&&(0!==(o=e[t])&&(e[t]=void 0),o)){var a=r&&("load"===r.type?"missing":r.type),n=r&&r.target&&r.target.src;d.message="Loading chunk "+t+" failed.\n("+a+": "+n+")",d.name="ChunkLoadError",d.type=a,d.request=n,o[1](d)}}),"chunk-"+t,t)}},c.O.j=t=>0===e[t];var t=(t,r)=>{var o,a,n=r[0],d=r[1],f=r[2],i=0;if(n.some((t=>0!==e[t]))){for(o in d)c.o(d,o)&&(c.m[o]=d[o]);if(f)var u=f(c)}for(t&&t(r);i{"use strict";var e,t,r,o,a,n={},d={};function f(e){var t=d[e];if(void 0!==t)return t.exports;var r=d[e]={id:e,loaded:!1,exports:{}};return n[e].call(r.exports,r,r.exports,f),r.loaded=!0,r.exports}f.m=n,f.c=d,e=[],f.O=(t,r,o,a)=>{if(!r){var n=1/0;for(u=0;u=a)&&Object.keys(f.O).every((e=>f.O[e](r[c])))?r.splice(c--,1):(d=!1,a0&&e[u-1][2]>a;u--)e[u]=e[u-1];e[u]=[r,o,a]},f.n=e=>{var t=e&&e.__esModule?()=>e.default:()=>e;return f.d(t,{a:t}),t},r=Object.getPrototypeOf?e=>Object.getPrototypeOf(e):e=>e.__proto__,f.t=function(e,o){if(1&o&&(e=this(e)),8&o)return e;if("object"==typeof e&&e){if(4&o&&e.__esModule)return e;if(16&o&&"function"==typeof e.then)return e}var a=Object.create(null);f.r(a);var 
n={};t=t||[null,r({}),r([]),r(r)];for(var d=2&o&&e;"object"==typeof d&&!~t.indexOf(d);d=r(d))Object.getOwnPropertyNames(d).forEach((t=>n[t]=()=>e[t]));return n.default=()=>e,f.d(a,n),a},f.d=(e,t)=>{for(var r in t)f.o(t,r)&&!f.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},f.f={},f.e=e=>Promise.all(Object.keys(f.f).reduce(((t,r)=>(f.f[r](e,t),t)),[])),f.u=e=>"assets/js/"+({53:"935f2afb",143:"42a922e9",150:"6ec58200",218:"8d0b11da",237:"1df93b7f",255:"dca12369",271:"93f51c74",310:"a6c9f398",514:"1be78505",598:"dbcee777",675:"2962c32e",741:"bde536f8",860:"3e407b54",870:"92d66db1",918:"17896441",958:"6dbc2e00",995:"076ee139"}[e]||e)+"."+{53:"52c36f3c",143:"1e0b6b58",150:"3dde5236",218:"eb9558d9",237:"71d7b441",255:"4d73fbd0",271:"edefd04a",310:"13ca4f4b",514:"131974b6",598:"7a7cfd52",675:"6182228c",741:"5bb9f476",860:"987a7018",870:"07fedd0a",918:"0aaaf3b3",958:"24fcb0eb",972:"d5cc17b1",995:"b8a84e34"}[e]+".js",f.miniCssF=e=>{},f.g=function(){if("object"==typeof globalThis)return globalThis;try{return this||new Function("return this")()}catch(e){if("object"==typeof window)return window}}(),f.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),o={},a="docs:",f.l=(e,t,r,n)=>{if(o[e])o[e].push(t);else{var d,c;if(void 0!==r)for(var i=document.getElementsByTagName("script"),u=0;u{d.onerror=d.onload=null,clearTimeout(s);var a=o[e];if(delete o[e],d.parentNode&&d.parentNode.removeChild(d),a&&a.forEach((e=>e(r))),t)return t(r)},s=setTimeout(l.bind(null,void 0,{type:"timeout",target:d}),12e4);d.onerror=l.bind(null,d.onerror),d.onload=l.bind(null,d.onload),c&&document.head.appendChild(d)}},f.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},f.p="/buzz/zh/",f.gca=function(e){return 
e={17896441:"918","935f2afb":"53","42a922e9":"143","6ec58200":"150","8d0b11da":"218","1df93b7f":"237",dca12369:"255","93f51c74":"271",a6c9f398:"310","1be78505":"514",dbcee777:"598","2962c32e":"675",bde536f8:"741","3e407b54":"860","92d66db1":"870","6dbc2e00":"958","076ee139":"995"}[e]||e,f.p+f.u(e)},(()=>{var e={303:0,532:0};f.f.j=(t,r)=>{var o=f.o(e,t)?e[t]:void 0;if(0!==o)if(o)r.push(o[2]);else if(/^(303|532)$/.test(t))e[t]=0;else{var a=new Promise(((r,a)=>o=e[t]=[r,a]));r.push(o[2]=a);var n=f.p+f.u(t),d=new Error;f.l(n,(r=>{if(f.o(e,t)&&(0!==(o=e[t])&&(e[t]=void 0),o)){var a=r&&("load"===r.type?"missing":r.type),n=r&&r.target&&r.target.src;d.message="Loading chunk "+t+" failed.\n("+a+": "+n+")",d.name="ChunkLoadError",d.type=a,d.request=n,o[1](d)}}),"chunk-"+t,t)}},f.O.j=t=>0===e[t];var t=(t,r)=>{var o,a,n=r[0],d=r[1],c=r[2],i=0;if(n.some((t=>0!==e[t]))){for(o in d)f.o(d,o)&&(f.m[o]=d[o]);if(c)var u=c(f)}for(t&&t(r);i 介绍 | Buzz - + @@ -17,7 +17,7 @@ Whisper.cppFaster WhisperWhisper 兼容的 Hugging Face 模型OpenAI Whisper API
  • 命令行界面
  • 支持 Mac、Windows 和 Linux
  • - + \ No newline at end of file diff --git a/zh/docs/cli.html b/zh/docs/cli.html index 7e329ae3..23662cd0 100644 --- a/zh/docs/cli.html +++ b/zh/docs/cli.html @@ -4,13 +4,13 @@ 命令行界面 (CLI) | Buzz - +

    命令行界面 (CLI)

    命令

    增加

    启动一个新的转录任务。

    Usage: buzz add [options] [file url file...]

    Options:
    -t, --task <task> The task to perform. Allowed: translate,
    transcribe. Default: transcribe.
    -m, --model-type <model-type> Model type. Allowed: whisper, whispercpp,
    huggingface, fasterwhisper, openaiapi. Default:
    whisper.
    -s, --model-size <model-size> Model size. Use only when --model-type is
    whisper, whispercpp, or fasterwhisper. Allowed:
    tiny, base, small, medium, large. Default:
    tiny.
    --hfid <id> Hugging Face model ID. Use only when
    --model-type is huggingface. Example:
    "openai/whisper-tiny"
    -l, --language <code> Language code. Allowed: af (Afrikaans), am
    (Amharic), ar (Arabic), as (Assamese), az
    (Azerbaijani), ba (Bashkir), be (Belarusian),
    bg (Bulgarian), bn (Bengali), bo (Tibetan), br
    (Breton), bs (Bosnian), ca (Catalan), cs
    (Czech), cy (Welsh), da (Danish), de (German),
    el (Greek), en (English), es (Spanish), et
    (Estonian), eu (Basque), fa (Persian), fi
    (Finnish), fo (Faroese), fr (French), gl
    (Galician), gu (Gujarati), ha (Hausa), haw
    (Hawaiian), he (Hebrew), hi (Hindi), hr
    (Croatian), ht (Haitian Creole), hu
    (Hungarian), hy (Armenian), id (Indonesian), is
    (Icelandic), it (Italian), ja (Japanese), jw
    (Javanese), ka (Georgian), kk (Kazakh), km
    (Khmer), kn (Kannada), ko (Korean), la (Latin),
    lb (Luxembourgish), ln (Lingala), lo (Lao), lt
    (Lithuanian), lv (Latvian), mg (Malagasy), mi
    (Maori), mk (Macedonian), ml (Malayalam), mn
    (Mongolian), mr (Marathi), ms (Malay), mt
    (Maltese), my (Myanmar), ne (Nepali), nl
    (Dutch), nn (Nynorsk), no (Norwegian), oc
    (Occitan), pa (Punjabi), pl (Polish), ps
    (Pashto), pt (Portuguese), ro (Romanian), ru
    (Russian), sa (Sanskrit), sd (Sindhi), si
    (Sinhala), sk (Slovak), sl (Slovenian), sn
    (Shona), so (Somali), sq (Albanian), sr
    (Serbian), su (Sundanese), sv (Swedish), sw
    (Swahili), ta (Tamil), te (Telugu), tg (Tajik),
    th (Thai), tk (Turkmen), tl (Tagalog), tr
    (Turkish), tt (Tatar), uk (Ukrainian), ur
    (Urdu), uz (Uzbek), vi (Vietnamese), yi
    (Yiddish), yo (Yoruba), zh (Chinese). Leave
    empty to detect language.
    -p, --prompt <prompt> Initial prompt.
    -w, --word-timestamps Generate word-level timestamps. (available since 1.2.0)
    --openai-token <token> OpenAI access token. Use only when
    --model-type is openaiapi. Defaults to your
    previously saved access token, if one exists.
    --srt Output result in an SRT file.
    --vtt Output result in a VTT file.
    --txt Output result in a TXT file.
    --hide-gui Hide the main application window. (available since 1.2.0)
    -h, --help Displays help on commandline options.
    --help-all Displays help including Qt specific options.
    -v, --version Displays version information.

    Arguments:
    files or urls Input file paths or urls. Url import available since 1.2.0.

    示例:

    # 使用 OpenAI Whisper API 将两个 MP3 文件从法语翻译为英语
    buzz add --task translate --language fr --model-type openaiapi /Users/user/Downloads/1b3b03e4-8db5-ea2c-ace5-b71ff32e3304.mp3 /Users/user/Downloads/koaf9083k1lkpsfdi0.mp3

    # 使用 Whisper.cpp "small" 模型转录一个 MP4 文件,并立即导出为 SRT 和 VTT 文件
    buzz add --task transcribe --model-type whispercpp --model-size small --prompt "My initial prompt(我的初始提示)" --srt --vtt /Users/user/Downloads/buzz/1b3b03e4-8db5-ea2c-ace5-b71ff32e3304.mp4
    - + \ No newline at end of file diff --git a/zh/docs/faq.html b/zh/docs/faq.html index e424d94e..1428c5e6 100644 --- a/zh/docs/faq.html +++ b/zh/docs/faq.html @@ -4,13 +4,13 @@ 常见问题(FAQ) | Buzz - +

    常见问题(FAQ)

    1. 模型存储在哪里?

    模型存储在以下位置:

    • Linux: ~/.cache/Buzz
    • Mac OS: ~/Library/Caches/Buzz
    • Windows: %USERPROFILE%\AppData\Local\Buzz\Buzz\Cache

    将上述路径粘贴到文件管理器中即可访问模型。

    2. 如果转录速度太慢,我可以尝试什么?

    语音识别需要大量计算资源,您可以尝试使用较小的 Whisper 模型,或者使用 Whisper.cpp 模型在本地计算机上运行语音识别。如果您的计算机配备了至少 6GB VRAM 的 GPU,可以尝试使用 Faster Whisper 模型。

    Buzz 还支持使用 OpenAI API 在远程服务器上进行语音识别。要使用此功能,您需要在“偏好设置”中设置 OpenAI API 密钥。详情请参见 偏好设置 部分。

    3. 如何录制系统音频?

    要转录系统音频,您需要配置虚拟音频设备,并将希望转录的应用程序输出连接到该虚拟扬声器。然后,您可以在 Buzz 中选择该设备作为音源。详情请参见 使用指南 部分。

    相关工具:

    4. 我应该使用哪个模型?

    选择模型大小取决于您的硬件和使用场景。较小的模型运行速度更快,但准确性较低;较大的模型更准确,但需要更强的硬件或更长的转录时间。

    在选择大模型时,请参考以下信息:

    • “Large” 是最早发布的模型
    • “Large-V2” 是后续改进版,准确率更高,被认为是某些语言中最稳定的选择
    • “Large-V3” 是最新版本,在许多情况下准确性最佳,但有时可能会产生错误的单词
    • “Turbo” 模型在速度和准确性之间取得了良好平衡

    最好的方法是测试所有模型,以找到最适合您语言的选项。

    5. 如何使用 GPU 加速以提高转录速度?

    • Linux 上,Nvidia GPU 受支持,可直接使用 GPU 加速。如果遇到问题,请安装 CUDA 12、cuBLAS 和 cuDNN。
    • Windows 上,请参阅此说明 以启用 CUDA GPU 支持。
    • Faster Whisper 需要 CUDA 12,使用旧版 CUDA 的计算机将默认使用 CPU。

    6. 如何修复 Unanticipated host error[PaErrorCode-9999]

    请检查系统设置,确保没有阻止应用访问麦克风。

    • Windows 用户请检查“设置 -> 隐私 -> 麦克风”,确保 Buzz 有权限使用麦克风。
    • 参考此视频的 方法 1
    • 方法 2 无需卸载防病毒软件,但可以尝试暂时禁用,或检查是否有相关设置阻止 Buzz 访问麦克风。

    7. 可以在没有互联网的计算机上使用 Buzz 吗?

    是的,您可以在离线计算机上使用 Buzz,但需要在另一台联网计算机上下载所需模型,并手动将其移动到离线计算机。

    最简单的方法是:

    1. 打开“帮助 -> 偏好设置 -> 模型”
    2. 下载所需的模型
    3. 点击“显示文件位置”按钮,打开存储模型的文件夹
    4. 将该模型文件夹复制到离线计算机的相同位置

    例如,在 Linux 上,模型存储在 ~/.cache/Buzz/models 目录中。

    8. Buzz 崩溃了,怎么办?

    如果模型下载不完整或损坏,Buzz 可能会崩溃。尝试删除已下载的模型文件,然后重新下载。

    如果问题仍然存在,请检查日志文件并报告问题,以便我们修复。日志文件位置如下:

    • Mac OS: ~/Library/Logs/Buzz
    • Windows: %USERPROFILE%\AppData\Local\Buzz\Buzz\Logs
    • Linux: 在终端运行 Buzz 查看相关错误信息。

    9. 哪里可以获取最新的开发版本?

    最新的开发版本包含最新的错误修复和新功能。如果您喜欢尝试新功能,可以下载最新的开发版本进行测试。

    • Linux 用户可以运行以下命令获取最新版本:
      sudo snap install buzz --edge
    • 其他平台 请按以下步骤操作:
      1. 访问 构建页面
      2. 点击最新构建的链接
      3. 在构建页面向下滚动到“Artifacts”部分
      4. 下载安装文件(请注意,您需要登录 GitHub 才能看到下载链接)
    - + \ No newline at end of file diff --git a/zh/docs/installation.html b/zh/docs/installation.html index 1084f2ec..5c2ce6d8 100644 --- a/zh/docs/installation.html +++ b/zh/docs/installation.html @@ -4,13 +4,13 @@ 安装 | Buzz - +

    安装

    要安装 Buzz,请下载适用于您操作系统的最新版本。Buzz 支持 Mac(Intel)、Windows 和 Linux 系统。

    macOS(Intel,macOS 11.7 及更高版本)

    通过 brew 安装:

    brew install --cask buzz

    或者,下载并运行 Buzz-x.y.z.dmg 文件。

    对于 Mac Silicon 用户(以及希望在 Mac Intel 上获得更好体验的用户)。

    Windows(Windows 10 及更高版本)

    下载并运行 Buzz-x.y.z.exe 文件。

    Linux

    sudo apt-get install libportaudio2 libcanberra-gtk-module libcanberra-gtk3-module
    sudo snap install buzz
    sudo snap connect buzz:password-manager-service

    从 Snap Store 获取

    或者,在 Ubuntu 20.04 及更高版本上,安装依赖项:

    sudo apt-get install libportaudio2

    然后,下载并解压 Buzz-x.y.z-unix.tar.gz 文件。

    PyPI

    pip install buzz-captions
    python -m buzz
    - + \ No newline at end of file diff --git a/zh/docs/preferences.html b/zh/docs/preferences.html index 8041b8c8..01716a2f 100644 --- a/zh/docs/preferences.html +++ b/zh/docs/preferences.html @@ -4,7 +4,7 @@ 偏好设置 | Buzz - + @@ -15,7 +15,7 @@ 在具有 16 线程的笔记本电脑上,设置 BUZZ_WHISPERCPP_N_THREADS=8 可以使转录时间加快约 15%。
    进一步增加线程数会导致转录时间变慢,因为并行线程的结果需要合并以生成最终答案。

    BUZZ_TRANSLATION_API_BASE_URL - 用于翻译的 OpenAI 兼容 API 的基础 URL。

    BUZZ_TRANSLATION_API_KEY - 用于翻译的 OpenAI 兼容 API 的密钥。

    BUZZ_MODEL_ROOT - 存储模型文件的根目录。
    默认为 user_cache_dir

    BUZZ_FAVORITE_LANGUAGES - 以逗号分隔的支持语言代码列表,显示在语言列表顶部。

    BUZZ_DOWNLOAD_COOKIEFILE - 用于下载私有视频或绕过反机器人保护的 cookiefile 的位置。

    BUZZ_FORCE_CPU - 强制 Buzz 使用 CPU 而不是 GPU,适用于旧 GPU 较慢或 GPU 有问题的设置。示例用法:BUZZ_FORCE_CPU=true。自 1.2.1 版本起可用。

    BUZZ_MERGE_REGROUP_RULE - 合并带有单词级时间戳的转录时使用的自定义重新分组规则。更多可用选项的信息请参阅 stable-ts 仓库。自 1.3.0 版本起可用。

    - + \ No newline at end of file diff --git a/zh/docs/usage/edit_and_resize.html b/zh/docs/usage/edit_and_resize.html index 60c0f926..79ea54e4 100644 --- a/zh/docs/usage/edit_and_resize.html +++ b/zh/docs/usage/edit_and_resize.html @@ -4,13 +4,13 @@ 编辑与调整 | Buzz - +

    编辑与调整

    当某个音频或视频文件完成转录后,你可以对其进行编辑,并将其导出为不同的字幕格式或纯文本。在转录列表中双击转录内容,即可查看用于编辑和导出的其他选项。

    转录视图界面提供了调整转录内容的选项。点击“调整”按钮,可查看可用的选项。对于在 启用单词级时间戳 设置下生成的转录内容,可以通过指定不同选项(如字幕的最大长度以及是否应在标点处拆分字幕)将其合并成字幕。而对于在 未启用单词级时间戳 设置下生成的转录内容,仅能通过指定所需的字幕最大长度来重新组合。

    如果系统中仍存在音频文件,单词级时间戳合并操作还会分析音频中的静音部分,以提高字幕的准确性。从带有单词级时间戳的转录内容生成字幕的功能自 1.3.0 版本起可用。

    - + \ No newline at end of file diff --git a/zh/docs/usage/file_import.html b/zh/docs/usage/file_import.html index ab572aaf..010249fb 100644 --- a/zh/docs/usage/file_import.html +++ b/zh/docs/usage/file_import.html @@ -4,13 +4,13 @@ 文件导入 | Buzz - +

    文件导入

    若要导入文件:

    • 点击“文件”菜单中的“导入媒体文件”(或者点击工具栏上的“+”图标,也可以使用快捷键 Command/Ctrl + O)。
    • 选择一个音频或视频文件。
    • 选择任务、语言和模型设置。
    • 点击“运行”。
    • 当转录状态显示为“已完成”时,双击该行(或者选中该行后点击“⤢”图标)即可打开转录内容。
    | 字段 | 选项 | 默认值 | 描述 |
    | --- | --- | --- | --- |
    | 导出格式 | "TXT"、"SRT"、"VTT" | "TXT" | 导出文件的格式 |
    | 单词级时间戳 | 关闭 / 开启 | 关闭 | 若勾选此项,转录内容将为音频中的每个单词生成单独的字幕行。仅当“导出格式”设置为“SRT”或“VTT”时此选项可用。 |
    | 提取语音 | 关闭 / 开启 | 关闭 | 若勾选此项,语音将被提取到单独的音轨中以提高转录准确性。此功能自 1.3.0 版本起可用。 |

    (有关任务、语言和质量设置的更多信息,请参阅实时录制部分。)

    Buzz 中的媒体文件导入

    - + \ No newline at end of file diff --git a/zh/docs/usage/live_recording.html b/zh/docs/usage/live_recording.html index 16fdbb13..3d078bad 100644 --- a/zh/docs/usage/live_recording.html +++ b/zh/docs/usage/live_recording.html @@ -4,13 +4,13 @@ 实时录制 | Buzz - +

    实时录制

    若要开始实时录制,请按以下步骤操作:

    • 选择录制任务、语言、质量和麦克风。
    • 点击“录制”。

    注意: 使用默认的 Whisper 模型转录音频会占用大量系统资源。若想实现实时性能,可考虑使用 Whisper.cpp Tiny 模型。

    | 字段 | 选项 | 默认值 | 描述 |
    | --- | --- | --- | --- |
    | 任务 | "转录"、"翻译" | "转录" | "转录"会将输入音频转换为所选语言的文本,而"翻译"则会将其转换为英文文本。 |
    | 语言 | 完整的支持语言列表请参阅 Whisper 文档 | "自动检测语言" | "自动检测语言"会根据音频的前几秒尝试检测其中的语言。不过,如果已知音频语言,建议手动选择,因为在很多情况下这可以提高转录质量。 |
    | 质量 | "极低"、"低"、"中"、"高" | "极低" | 转录质量决定了用于转录的 Whisper 模型。"极低"使用"tiny"模型;"低"使用"base"模型;"中"使用"small"模型;"高"使用"medium"模型。模型越大,转录质量越高,但所需的系统资源也越多。更多关于模型的信息请参阅 Whisper 文档。 |
    | 麦克风 | [系统可用麦克风] | [系统默认麦克风] | 用于录制输入音频的麦克风。 |

    Buzz 实时录制

    录制电脑播放的音频(macOS)

    若要录制电脑应用程序播放的音频,你可以安装一个音频回环驱动程序(一种可让你创建虚拟音频设备的程序)。本指南后续将介绍在 Mac 上使用 BlackHole 的方法,但你也可以根据自己的操作系统选择其他替代方案(例如 LoopBeAudio、LoopBack 和 Virtual Audio Cable)。

    1. 通过 Homebrew 安装 BlackHole

      brew install blackhole-2ch
    2. 通过聚焦搜索(Spotlight)或直接打开 /Applications/Utilities/Audio Midi Setup.app 来启动“音频 MIDI 设置”。

    通过聚焦搜索打开音频MIDI设置

    1. 点击窗口左下角的“+”图标,然后选择“创建多输出设备”。

    创建多输出设备

    1. 将你的默认扬声器和 BlackHole 添加到这个多输出设备中。

    多输出设备截图

    1. 将此多输出设备设置为你的扬声器(可在应用程序内或系统全局进行设置),这样音频就会被输送到 BlackHole 中。

    2. 打开 Buzz 软件,选择 BlackHole 作为录音的麦克风,接着像平常一样进行录制,你就能看到通过 BlackHole 播放的音频的转录文本了。

    录制电脑播放的音频(Windows)

    若要转录系统音频,你需要配置虚拟音频设备,并将你想要转录的应用程序的音频输出连接到该虚拟扬声器。之后,你就可以在 Buzz 中选择它作为音频源。

    1. 安装 [VB CABLE](https://vb-audio.com/Cable/) 作为虚拟音频设备。
    2. 使用 Windows 声音设置进行配置。右键单击系统托盘里的扬声器图标,然后选择“打开声音设置”。在“选择你的输出设备”下拉菜单中,选择“CABLE Input”,将所有系统声音发送到虚拟设备;或者使用“高级声音选项”,选择要将声音输出到该设备的应用程序。

    录制电脑播放的音频(Linux)

    正如 Ubuntu 维基 中所述,在任何使用 PulseAudio 的 Linux 系统上,你可以将应用程序的音频重定向到虚拟扬声器。之后,你可以在 Buzz 中选择它作为音频源。

    总体步骤如下:

    1. 启动会产生你想要转录的声音的应用程序,并开始播放。例如,在媒体播放器中播放视频。
    2. 启动 Buzz 并打开实时录制界面,以便查看设置。
    3. 在 PulseAudio 音量控制(pavucontrol)的“录制”选项卡中,配置从你想要转录声音的应用程序到 Buzz 的声音路由。
    - + \ No newline at end of file diff --git a/zh/docs/usage/speaker_identification.html b/zh/docs/usage/speaker_identification.html index 56a65632..2ef8a0a3 100644 --- a/zh/docs/usage/speaker_identification.html +++ b/zh/docs/usage/speaker_identification.html @@ -4,13 +4,13 @@ Speaker identification | Buzz - +
    -

    Speaker identification

    When transcript of some audio or video file is generated you can identify speakers in the transcript. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    Transcription view screen has option to identify speakers. Click on the "Identify speakers" button so see available options.

    If audio file is still present on the system speaker identification will mark each speakers sentences with appropriate label. You can preview 10 seconds of some random sentence of the identified speaker and rename the automatically identified label to speakers real name. If "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is available since version 1.4.0 on all platforms except Intel macOS.

    - +

    Speaker identification

    Once a transcript of an audio or video file has been generated, you can identify the speakers in it. Double-click the transcript in the list of transcripts to see additional options for editing and exporting.

    The transcription view screen has an option to identify speakers. Click the "Identify speakers" button to see the available options.

    If the audio file is still present on the system, speaker identification will mark each speaker's sentences with an appropriate label. You can preview 10 seconds of a random sentence from the identified speaker and rename the automatically identified label to the speaker's real name. If the "Merge speaker sentences" checkbox is selected when you save the speaker labels, all consecutive sentences of the same speaker will be merged into one segment. Speaker identification is not available on Intel macOS.

    + \ No newline at end of file diff --git a/zh/docs/usage/transcription_viewer.html b/zh/docs/usage/transcription_viewer.html index d9a99a2c..72831077 100644 --- a/zh/docs/usage/transcription_viewer.html +++ b/zh/docs/usage/transcription_viewer.html @@ -4,13 +4,13 @@ Transcription Viewer | Buzz - +
    -

    Transcription Viewer

    The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.

    Overview

    The transcription viewer is organized into several key sections:

    • Top Toolbar: Contains view mode, export, translate, resize, and search
    • Search Bar: Find and navigate through transcript text
    • Transcription Segments: Table view of all transcription segments with timestamps
    • Playback Controls: Audio playback settings and speed controls (since version 1.3.0)
    • Audio Player: Standard media player with progress bar
    • Current Segment Display: Shows the currently selected or playing segment

    Top Toolbar

    View Mode Button

    • Function: Switch between different viewing modes
    • Options:
      • Timestamps: Shows segments in a table format with start/end times
      • Text: Shows combined text without timestamps
      • Translation: Shows translated text (if available)

    Export Button

    • Function: Export transcription in various formats
    • Formats: SRT, VTT, TXT, JSON, and more
    • Usage: Click to open export menu and select desired format

    Translate Button

    • Function: Translate transcription to different languages
    • Usage: Click to open translation settings and start translation

    Resize Button

    • Function: Adjust transcription segment boundaries
    • Usage: Click to open resize dialog for fine-tuning timestamps
    • More information: See Edit and Resize section

    Playback Controls Button

    (since version 1.3.0)

    • Function: Show/hide playback control panel
    • Shortcut: Ctrl+Alt+P (Windows/Linux) or Cmd+Alt+P (macOS)
    • Behavior: Toggle button that shows/hides the playback controls below

    Find Button

    (since version 1.3.0)

    • Function: Show/hide search functionality
    • Shortcut: Ctrl+F (Windows/Linux) or Cmd+F (macOS)
    • Behavior: Toggle button that shows/hides the search bar

    Scroll to Current Button

    (since version 1.3.0)

    • Function: Automatically scroll to the currently playing text
    • Shortcut: Ctrl+G (Windows/Linux) or Cmd+G (macOS)
    • Usage: Click to jump to the current audio position in the transcript

    Search Functionality

    (since version 1.3.0)

    The search bar appears below the toolbar when activated and provides:

    • Search Input: Type text to find in the transcription (wider input field for better usability)
    • Navigation: Up/down arrows to move between matches
    • Status: Shows current match position and total matches (e.g., "3 of 15 matches")
    • Clear: Remove search text and results (larger button for better accessibility)
    • Results: Displays found text with context
    • Consistent Button Sizing: All navigation buttons have uniform height for better visual consistency

    Search Shortcuts

    • Ctrl+F / Cmd+F: Toggle search bar on/off
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar

    Search Features

    • Real-time Search: Results update as you type
    • Case-insensitive: Finds matches regardless of capitalization
    • Word Boundaries: Respects word boundaries for accurate matching
    • Cross-view Search: Works in all view modes (Timestamps, Text, Translation)

    Playback Controls

    (since version 1.3.0)

    Loop Segment

    • Function: Automatically loop playback of selected segments
    • Usage: Check the "Loop Segment" checkbox
    • Behavior: When enabled, clicking on a transcript segment will set a loop range
    • Visual Feedback: Loop range is highlighted in the audio player

    Follow Audio

    • Function: Automatically scroll to current audio position
    • Usage: Check the "Follow Audio" checkbox
    • Behavior: Transcript automatically follows the audio playback
    • Benefits: Easy to follow along with long audio files

    Speed Controls

    • Function: Adjust audio playback speed
    • Range: 0.5x to 2.0x speed
    • Controls:
      • Speed Dropdown: Select from preset speeds or enter custom value
      • Decrease Button (-): Reduce speed by 0.05x increments
      • Increase Button (+): Increase speed by 0.05x increments
    • Persistence: Speed setting is saved between sessions
    • Button Sizing: Speed control buttons match the size of search navigation buttons for visual consistency

    Keyboard Shortcuts

    (since version 1.3.0)

    Audio Playback

    • Ctrl+P / Cmd+P: Play/Pause audio
    • Ctrl+Shift+P / Cmd+Shift+P: Replay current segment from start

    Timestamp Adjustment

    • Ctrl+← / Cmd+←: Decrease segment start time by 0.5s
    • Ctrl+→ / Cmd+→: Increase segment start time by 0.5s
    • Ctrl+Shift+← / Cmd+Shift+←: Decrease segment end time by 0.5s
    • Ctrl+Shift+→ / Cmd+Shift+→: Increase segment end time by 0.5s
    • Ctrl+F / Cmd+F: Toggle search bar
    • Ctrl+Alt+P / Cmd+Alt+P: Toggle playback controls
    • Ctrl+G / Cmd+G: Scroll to current position
    • Ctrl+O / Cmd+O: Open file import dialog
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar
    - +

    Transcription Viewer

    The Buzz transcription viewer provides a powerful interface for reviewing, editing, and navigating through your transcriptions. This guide covers all the features available in the transcription viewer.

    Overview

    The transcription viewer is organized into several key sections:

    • Top Toolbar: Contains view mode, export, translate, resize, and search
    • Search Bar: Find and navigate through transcript text
    • Transcription Segments: Table view of all transcription segments with timestamps
    • Playback Controls: Audio playback settings and speed controls
    • Audio Player: Standard media player with progress bar
    • Current Segment Display: Shows the currently selected or playing segment

    Top Toolbar

    View Mode Button

    • Function: Switch between different viewing modes
    • Options:
      • Timestamps: Shows segments in a table format with start/end times
      • Text: Shows combined text without timestamps
      • Translation: Shows translated text (if available)

    Export Button

    • Function: Export transcription in various formats
    • Formats: SRT, VTT, TXT, JSON, and more
    • Usage: Click to open export menu and select desired format

    Translate Button

    • Function: Translate transcription to different languages
    • Usage: Click to open translation settings and start translation

    Resize Button

    • Function: Adjust transcription segment boundaries
    • Usage: Click to open resize dialog for fine-tuning timestamps
    • More information: See Edit and Resize section

    Playback Controls Button

    • Function: Show/hide playback control panel
    • Shortcut: Ctrl+Alt+P (Windows/Linux) or Cmd+Alt+P (macOS)
    • Behavior: Toggle button that shows/hides the playback controls below

    Find Button

    • Function: Show/hide search functionality
    • Shortcut: Ctrl+F (Windows/Linux) or Cmd+F (macOS)
    • Behavior: Toggle button that shows/hides the search bar

    Scroll to Current Button

    • Function: Automatically scroll to the currently playing text
    • Shortcut: Ctrl+G (Windows/Linux) or Cmd+G (macOS)
    • Usage: Click to jump to the current audio position in the transcript

    Search Functionality

    The search bar appears below the toolbar when activated and provides:

    • Search Input: Type text to find in the transcription (wider input field for better usability)
    • Navigation: Up/down arrows to move between matches
    • Status: Shows current match position and total matches (e.g., "3 of 15 matches")
    • Clear: Remove search text and results (larger button for better accessibility)
    • Results: Displays found text with context
    • Consistent Button Sizing: All navigation buttons have uniform height for better visual consistency

    Search Shortcuts

    • Ctrl+F / Cmd+F: Toggle search bar on/off
    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar

    Search Features

    • Real-time Search: Results update as you type
    • Case-insensitive: Finds matches regardless of capitalization
    • Word Boundaries: Respects word boundaries for accurate matching
    • Cross-view Search: Works in all view modes (Timestamps, Text, Translation)

    Playback Controls

    Loop Segment

    • Function: Automatically loop playback of selected segments
    • Usage: Check the "Loop Segment" checkbox
    • Behavior: When enabled, clicking on a transcript segment will set a loop range
    • Visual Feedback: Loop range is highlighted in the audio player

    Follow Audio

    • Function: Automatically scroll to current audio position
    • Usage: Check the "Follow Audio" checkbox
    • Behavior: Transcript automatically follows the audio playback
    • Benefits: Easy to follow along with long audio files

    Speed Controls

    • Function: Adjust audio playback speed
    • Range: 0.5x to 2.0x speed
    • Controls:
      • Speed Dropdown: Select from preset speeds or enter custom value
      • Decrease Button (-): Reduce speed by 0.05x increments
      • Increase Button (+): Increase speed by 0.05x increments
    • Persistence: Speed setting is saved between sessions
    • Button Sizing: Speed control buttons match the size of search navigation buttons for visual consistency

    Keyboard Shortcuts

    Audio Playback

    • Ctrl+P / Cmd+P: Play/Pause audio
    • Ctrl+Shift+P / Cmd+Shift+P: Replay current segment from start

    Timestamp Adjustment

    • Ctrl+← / Cmd+←: Decrease segment start time by 0.5s
    • Ctrl+→ / Cmd+→: Increase segment start time by 0.5s
    • Ctrl+Shift+← / Cmd+Shift+←: Decrease segment end time by 0.5s
    • Ctrl+Shift+→ / Cmd+Shift+→: Increase segment end time by 0.5s

    Navigation

    • Ctrl+F / Cmd+F: Toggle search bar
    • Ctrl+Alt+P / Cmd+Alt+P: Toggle playback controls
    • Ctrl+G / Cmd+G: Scroll to current position
    • Ctrl+O / Cmd+O: Open file import dialog

    Search

    • Enter: Find next match
    • Shift+Enter: Find previous match
    • Escape: Close search bar
    + \ No newline at end of file diff --git a/zh/docs/usage/translations.html b/zh/docs/usage/translations.html index 75f22d5d..512d375a 100644 --- a/zh/docs/usage/translations.html +++ b/zh/docs/usage/translations.html @@ -4,13 +4,13 @@ 翻译功能 | Buzz - +

    翻译功能

    默认的“翻译”任务借助 Whisper 模型将内容翻译成英语。从 1.0.0 版本开始,Buzz 支持使用其他人工智能将内容翻译成任意语言。

    若要使用翻译功能,你需要配置 OpenAI API 密钥和翻译设置。在“偏好设置”中设置 OpenAI API 密钥。Buzz 也支持本地运行的、兼容 OpenAI API 的自定义翻译人工智能。有关本地运行人工智能的更多信息,请参阅 ollama 或 LM Studio。有关可用自定义 API 的信息,请查看这个 讨论线程。

    若要为实时录制配置翻译功能,可在实时录制设置的“高级设置”对话框中启用该功能。输入要使用的人工智能模型,并提供给人工智能的翻译指令提示。对于已经完成语音识别的文件,也可以使用翻译功能。在转录查看器工具栏上点击“翻译”按钮即可。

    为了让人工智能知道如何进行翻译,请在“给人工智能的指令”部分输入翻译说明。在说明中,你应该明确指出要将文本翻译成何种语言。此外,由于人工智能往往会添加一些注释或备注,你可能需要额外添加指令禁止其这么做。以下是一个将英语字幕翻译成西班牙语的指令示例:

    你是一位专业翻译人员,擅长将英语翻译成西班牙语。你只需将发给你的每一句话翻译成西班牙语,不要添加任何注释或备注。

    如果你在“偏好设置”中启用了“启用实时录制转录导出”功能,实时文本转录内容在生成和翻译后将被导出到一个文本文件中。这个文件可用于将实时转录内容与其他应用程序(如 OBS Studio)进行进一步集成。

    使用 ChatGPT gpt-4o 模型对一小时长的音频进行翻译,费用约为 0.50 美元。

    - + \ No newline at end of file diff --git a/zh/index.html b/zh/index.html index fb5682f7..76826ef5 100644 --- a/zh/index.html +++ b/zh/index.html @@ -4,13 +4,13 @@ Buzz - +
    - + \ No newline at end of file