Spaces:
Running
Running
jhj0517
committed on
Commit
•
fbcbf8a
1
Parent(s):
d11cbce
Add UVR BGM separation
Browse files
app.py
CHANGED
@@ -48,6 +48,7 @@ class App:
|
|
48 |
whisper_params = self.default_params["whisper"]
|
49 |
vad_params = self.default_params["vad"]
|
50 |
diarization_params = self.default_params["diarization"]
|
|
|
51 |
|
52 |
with gr.Row():
|
53 |
dd_model = gr.Dropdown(choices=self.whisper_inf.available_models, value=whisper_params["model_size"],
|
@@ -150,6 +151,17 @@ class App:
|
|
150 |
nb_speech_pad_ms = gr.Number(label="Speech Padding (ms)", precision=0, value=vad_params["speech_pad_ms"],
|
151 |
info="Final speech chunks are padded by this time each side")
|
152 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
153 |
with gr.Accordion("Diarization", open=False):
|
154 |
cb_diarize = gr.Checkbox(label="Enable Diarization", value=diarization_params["is_diarize"])
|
155 |
tb_hf_token = gr.Text(label="HuggingFace Token", value=diarization_params["hf_token"],
|
@@ -179,7 +191,9 @@ class App:
|
|
179 |
hallucination_silence_threshold=nb_hallucination_silence_threshold, hotwords=tb_hotwords,
|
180 |
language_detection_threshold=nb_language_detection_threshold,
|
181 |
language_detection_segments=nb_language_detection_segments,
|
182 |
-
prompt_reset_on_temperature=sld_prompt_reset_on_temperature
|
|
|
|
|
183 |
),
|
184 |
dd_file_format,
|
185 |
cb_timestamp
|
|
|
48 |
whisper_params = self.default_params["whisper"]
|
49 |
vad_params = self.default_params["vad"]
|
50 |
diarization_params = self.default_params["diarization"]
|
51 |
+
uvr_params = self.default_params["bgm-separation"]
|
52 |
|
53 |
with gr.Row():
|
54 |
dd_model = gr.Dropdown(choices=self.whisper_inf.available_models, value=whisper_params["model_size"],
|
|
|
151 |
nb_speech_pad_ms = gr.Number(label="Speech Padding (ms)", precision=0, value=vad_params["speech_pad_ms"],
|
152 |
info="Final speech chunks are padded by this time each side")
|
153 |
|
154 |
+
with gr.Accordion("BGM Separation", open=False):
|
155 |
+
cb_bgm_separation = gr.Checkbox(label="Enable BGM separation", value=uvr_params["is_separate_bgm"],
|
156 |
+
interactive=True)
|
157 |
+
dd_uvr_device = gr.Dropdown(label="Device", value=self.music_separator.device,
|
158 |
+
choices=self.music_separator.available_devices)
|
159 |
+
dd_uvr_model_size = gr.Dropdown(label="Model", value=uvr_params["model_size"],
|
160 |
+
choices=self.music_separator.available_models)
|
161 |
+
nb_uvr_segment_size = gr.Number(label="Segment Size", value=uvr_params["segment_size"], precision=0)
|
162 |
+
cb_uvr_save_file = gr.Checkbox(label="Save Separated Files to Output Directory",
|
163 |
+
value=uvr_params["save_file"], interactive=True)
|
164 |
+
|
165 |
with gr.Accordion("Diarization", open=False):
|
166 |
cb_diarize = gr.Checkbox(label="Enable Diarization", value=diarization_params["is_diarize"])
|
167 |
tb_hf_token = gr.Text(label="HuggingFace Token", value=diarization_params["hf_token"],
|
|
|
191 |
hallucination_silence_threshold=nb_hallucination_silence_threshold, hotwords=tb_hotwords,
|
192 |
language_detection_threshold=nb_language_detection_threshold,
|
193 |
language_detection_segments=nb_language_detection_segments,
|
194 |
+
prompt_reset_on_temperature=sld_prompt_reset_on_temperature, is_bgm_separate=cb_bgm_separation,
|
195 |
+
uvr_device=dd_uvr_device, uvr_model_size=dd_uvr_model_size, uvr_segment_size=nb_uvr_segment_size,
|
196 |
+
uvr_save_file=cb_uvr_save_file
|
197 |
),
|
198 |
dd_file_format,
|
199 |
cb_timestamp
|