Upload 4 files
Browse files
- CKPT.yaml +14 -0
- generator.ckpt +3 -0
- hyperparams.yaml +45 -0
- kmeans.ckpt +3 -0
CKPT.yaml
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# yamllint disable
|
2 |
+
D_loss: 2.1025607585906982
|
3 |
+
D_mse_gan_fake_loss: 0.1479564905166626
|
4 |
+
D_mse_gan_loss: 2.1025607585906982
|
5 |
+
D_mse_gan_real_loss: 0.03515475243330002
|
6 |
+
G_adv_loss: 5.534212112426758
|
7 |
+
G_feat_match_loss: 0.12056709825992584
|
8 |
+
G_gen_loss: 32.30398178100586
|
9 |
+
G_l1_spec_loss: 0.7178663015365601
|
10 |
+
G_loss: 37.83819580078125
|
11 |
+
G_mse_fake_loss: 4.328541278839111
|
12 |
+
end-of-epoch: true
|
13 |
+
epoch: 200
|
14 |
+
unixtime: 1690560231.9180694
|
generator.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05e5ebcb88438a335eed3e8f6d50cf91df80204d501dd20c3b11b36f81938719
|
3 |
+
size 53587561
|
hyperparams.yaml
ADDED
@@ -0,0 +1,45 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
num_embeddings: 100
|
2 |
+
embedding_dim: 128
|
3 |
+
|
4 |
+
in_channels: 128
|
5 |
+
out_channels: 1
|
6 |
+
resblock_type: "1"
|
7 |
+
resblock_dilation_sizes: [[1, 3, 5], [1, 3, 5], [1, 3, 5]]
|
8 |
+
resblock_kernel_sizes: [3, 7, 11]
|
9 |
+
upsample_kernel_sizes: [11, 8, 8, 4, 4]
|
10 |
+
upsample_initial_channel: 512
|
11 |
+
upsample_factors: [5, 4, 4, 2, 2]
|
12 |
+
inference_padding: 5
|
13 |
+
cond_channels: 0
|
14 |
+
conv_post_bias: True
|
15 |
+
|
16 |
+
var_pred_hidden_dim: 128
|
17 |
+
var_pred_kernel_size: 3
|
18 |
+
var_pred_dropout: 0.5
|
19 |
+
dur_prediction_weight: 1.0
|
20 |
+
|
21 |
+
generator: !new:speechbrain.lobes.models.HifiGAN.UnitHifiganGenerator
|
22 |
+
    in_channels: !ref <in_channels>
|
23 |
+
    out_channels: !ref <out_channels>
|
24 |
+
    resblock_type: !ref <resblock_type>
|
25 |
+
    resblock_dilation_sizes: !ref <resblock_dilation_sizes>
|
26 |
+
    resblock_kernel_sizes: !ref <resblock_kernel_sizes>
|
27 |
+
    upsample_kernel_sizes: !ref <upsample_kernel_sizes>
|
28 |
+
    upsample_initial_channel: !ref <upsample_initial_channel>
|
29 |
+
    upsample_factors: !ref <upsample_factors>
|
30 |
+
    inference_padding: !ref <inference_padding>
|
31 |
+
    cond_channels: !ref <cond_channels>
|
32 |
+
    conv_post_bias: !ref <conv_post_bias>
|
33 |
+
    num_embeddings: !ref <num_embeddings>
|
34 |
+
    embedding_dim: !ref <embedding_dim>
|
35 |
+
    duration_predictor: True
|
36 |
+
    var_pred_hidden_dim: !ref <var_pred_hidden_dim>
|
37 |
+
    var_pred_kernel_size: !ref <var_pred_kernel_size>
|
38 |
+
    var_pred_dropout: !ref <var_pred_dropout>
|
39 |
+
|
40 |
+
modules:
|
41 |
+
    generator: !ref <generator>
|
42 |
+
|
43 |
+
pretrainer: !new:speechbrain.utils.parameter_transfer.Pretrainer
|
44 |
+
    loadables:
|
45 |
+
        generator: !ref <generator>
|
kmeans.ckpt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba586956416308b3cfca603db971149ffe53785dbeca1ec20139997a4ee37aa3
|
3 |
+
size 3747083
|