Spaces:
Running
Running
darksakura
committed on
Commit
•
51d483c
1
Parent(s):
e8ed104
Upload config.json
Browse files - configs/config.json +16 -10
configs/config.json
CHANGED
@@ -1,17 +1,18 @@
|
|
1 |
{
|
2 |
"train": {
|
3 |
-
"log_interval":
|
4 |
-
"eval_interval":
|
5 |
"seed": 1234,
|
6 |
"epochs": 10000,
|
7 |
-
"learning_rate": 0.
|
8 |
"betas": [
|
9 |
0.8,
|
10 |
0.99
|
11 |
],
|
12 |
"eps": 1e-09,
|
13 |
-
"batch_size":
|
14 |
"fp16_run": false,
|
|
|
15 |
"lr_decay": 0.999875,
|
16 |
"segment_size": 10240,
|
17 |
"init_lr_ratio": 1,
|
@@ -21,7 +22,7 @@
|
|
21 |
"use_sr": true,
|
22 |
"max_speclen": 512,
|
23 |
"port": "8001",
|
24 |
-
"keep_ckpts":
|
25 |
"all_in_mem": false,
|
26 |
"vol_aug": true
|
27 |
},
|
@@ -35,7 +36,8 @@
|
|
35 |
"win_length": 2048,
|
36 |
"n_mel_channels": 80,
|
37 |
"mel_fmin": 0.0,
|
38 |
-
"mel_fmax": 22050
|
|
|
39 |
},
|
40 |
"model": {
|
41 |
"inter_channels": 192,
|
@@ -84,13 +86,18 @@
|
|
84 |
4
|
85 |
],
|
86 |
"n_layers_q": 3,
|
|
|
87 |
"use_spectral_norm": false,
|
88 |
"gin_channels": 768,
|
89 |
"ssl_dim": 768,
|
90 |
-
"n_speakers":
|
|
|
91 |
"speech_encoder": "vec768l12",
|
92 |
"speaker_embedding": false,
|
93 |
-
"vol_embedding": true
|
|
|
|
|
|
|
94 |
},
|
95 |
"spk": {
|
96 |
"AKIMOTO_MANATSU": 0,
|
@@ -153,7 +160,6 @@
|
|
153 |
"WATANABE_MIRIA": 57,
|
154 |
"YAKUBO_MIO": 58,
|
155 |
"YAMASHITA_MIZUKI": 59,
|
156 |
-
"
|
157 |
-
"YODA_YUUKI": 61
|
158 |
}
|
159 |
}
|
|
|
1 |
{
|
2 |
"train": {
|
3 |
+
"log_interval": 1000,
|
4 |
+
"eval_interval": 2000,
|
5 |
"seed": 1234,
|
6 |
"epochs": 10000,
|
7 |
+
"learning_rate": 0.00015,
|
8 |
"betas": [
|
9 |
0.8,
|
10 |
0.99
|
11 |
],
|
12 |
"eps": 1e-09,
|
13 |
+
"batch_size": 5,
|
14 |
"fp16_run": false,
|
15 |
+
"half_type": "fp16",
|
16 |
"lr_decay": 0.999875,
|
17 |
"segment_size": 10240,
|
18 |
"init_lr_ratio": 1,
|
|
|
22 |
"use_sr": true,
|
23 |
"max_speclen": 512,
|
24 |
"port": "8001",
|
25 |
+
"keep_ckpts": 50,
|
26 |
"all_in_mem": false,
|
27 |
"vol_aug": true
|
28 |
},
|
|
|
36 |
"win_length": 2048,
|
37 |
"n_mel_channels": 80,
|
38 |
"mel_fmin": 0.0,
|
39 |
+
"mel_fmax": 22050,
|
40 |
+
"unit_interpolate_mode": "nearest"
|
41 |
},
|
42 |
"model": {
|
43 |
"inter_channels": 192,
|
|
|
86 |
4
|
87 |
],
|
88 |
"n_layers_q": 3,
|
89 |
+
"n_flow_layer": 4,
|
90 |
"use_spectral_norm": false,
|
91 |
"gin_channels": 768,
|
92 |
"ssl_dim": 768,
|
93 |
+
"n_speakers": 61,
|
94 |
+
"vocoder_name": "nsf-hifigan",
|
95 |
"speech_encoder": "vec768l12",
|
96 |
"speaker_embedding": false,
|
97 |
+
"vol_embedding": true,
|
98 |
+
"use_depthwise_conv": false,
|
99 |
+
"flow_share_parameter": false,
|
100 |
+
"use_automatic_f0_prediction": true
|
101 |
},
|
102 |
"spk": {
|
103 |
"AKIMOTO_MANATSU": 0,
|
|
|
160 |
"WATANABE_MIRIA": 57,
|
161 |
"YAKUBO_MIO": 58,
|
162 |
"YAMASHITA_MIZUKI": 59,
|
163 |
+
"YODA_YUUKI": 60
|
|
|
164 |
}
|
165 |
}
|