Spaces:
Paused
Paused
darksakura
committed on
Commit
•
a148559
1
Parent(s):
2b59e57
Upload app.py
Browse files
app.py
CHANGED
@@ -149,8 +149,10 @@ def infer(text, sdp_ratio, noise_scale, noise_scale_w, length_scale, sid, langua
|
|
149 |
|
150 |
|
151 |
def tts_fn(
|
152 |
-
text, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale,LongSentence
|
153 |
):
|
|
|
|
|
154 |
if not LongSentence:
|
155 |
with torch.no_grad():
|
156 |
audio = infer(
|
@@ -160,7 +162,7 @@ def tts_fn(
|
|
160 |
noise_scale_w=noise_scale_w,
|
161 |
length_scale=length_scale,
|
162 |
sid=speaker,
|
163 |
-
language=
|
164 |
)
|
165 |
torch.cuda.empty_cache()
|
166 |
|
@@ -184,7 +186,7 @@ def tts_fn(
|
|
184 |
noise_scale_w=noise_scale_w,
|
185 |
length_scale=length_scale,
|
186 |
sid=speaker,
|
187 |
-
language=
|
188 |
)
|
189 |
audio_fin.append(audio)
|
190 |
|
@@ -253,10 +255,9 @@ if __name__ == "__main__":
|
|
253 |
_ = net_g.eval()
|
254 |
|
255 |
_ = utils.load_checkpoint(args.model, net_g, None, skip_optimizer=True)
|
256 |
-
|
257 |
speaker_ids = hps.data.spk2id
|
258 |
speakers = list(speaker_ids.keys())
|
259 |
-
languages = ["ZH", "JP"]
|
260 |
with gr.Blocks() as app:
|
261 |
|
262 |
gr.Markdown(
|
@@ -304,6 +305,9 @@ if __name__ == "__main__":
|
|
304 |
speaker = gr.Dropdown(
|
305 |
choices=speakers, value=name, label="说话人(在这选择说话人将保留输入文本)"
|
306 |
)
|
|
|
|
|
|
|
307 |
btn.click(
|
308 |
tts_fn,
|
309 |
inputs=[
|
@@ -314,6 +318,7 @@ if __name__ == "__main__":
|
|
314 |
noise_scale_w,
|
315 |
length_scale,
|
316 |
LongSentence,
|
|
|
317 |
],
|
318 |
outputs=[audio_output],
|
319 |
)
|
|
|
149 |
|
150 |
|
151 |
def tts_fn(
|
152 |
+
text, speaker, sdp_ratio, noise_scale, noise_scale_w, length_scale,LongSentence,correct_language
|
153 |
):
|
154 |
+
if correct_language == "Auto":
|
155 |
+
correct_language = "JP" if is_japanese(text) else "ZH"
|
156 |
if not LongSentence:
|
157 |
with torch.no_grad():
|
158 |
audio = infer(
|
|
|
162 |
noise_scale_w=noise_scale_w,
|
163 |
length_scale=length_scale,
|
164 |
sid=speaker,
|
165 |
+
language= correct_language,
|
166 |
)
|
167 |
torch.cuda.empty_cache()
|
168 |
|
|
|
186 |
noise_scale_w=noise_scale_w,
|
187 |
length_scale=length_scale,
|
188 |
sid=speaker,
|
189 |
+
language= correct_language,
|
190 |
)
|
191 |
audio_fin.append(audio)
|
192 |
|
|
|
255 |
_ = net_g.eval()
|
256 |
|
257 |
_ = utils.load_checkpoint(args.model, net_g, None, skip_optimizer=True)
|
|
|
258 |
speaker_ids = hps.data.spk2id
|
259 |
speakers = list(speaker_ids.keys())
|
260 |
+
languages = ["Auto","ZH", "JP"]
|
261 |
with gr.Blocks() as app:
|
262 |
|
263 |
gr.Markdown(
|
|
|
305 |
speaker = gr.Dropdown(
|
306 |
choices=speakers, value=name, label="说话人(在这选择说话人将保留输入文本)"
|
307 |
)
|
308 |
+
correct_language = gr.Dropdown(
|
309 |
+
choices=languages, value=languages[0], label="Language(如果发生报错请手动指定)"
|
310 |
+
)
|
311 |
btn.click(
|
312 |
tts_fn,
|
313 |
inputs=[
|
|
|
318 |
noise_scale_w,
|
319 |
length_scale,
|
320 |
LongSentence,
|
321 |
+
correct_language,
|
322 |
],
|
323 |
outputs=[audio_output],
|
324 |
)
|