# File-viewer metadata (not part of the configuration):
#   File size: 2,558 Bytes
#   fdb9167
#   (line-number gutter 1-143 omitted)
# Top-level run settings. Their exact semantics are defined by the training
# script that loads this file, which is not shown here.
allow_cache: true
# Both step limits below are 8192, i.e. 16 * hop_size (512).
# NOTE(review): presumably a per-sample length in audio samples -- confirm.
batch_max_steps: 8192
batch_max_steps_valid: 8192
batch_size: 32
# Relative paths (start with ./).
# NOTE(review): presumably resolved against the launch directory -- confirm.
config: ./TensorFlowTTS/examples/multiband_melgan_hf/conf/multiband_melgan_hf.sw.v2.yml
dev_dir: ./dump/valid/
discriminator_mixed_precision: false
# Optimizer settings for the discriminator.
# The child keys must stay indented under this mapping: at column 0 they
# become top-level keys, this mapping parses as null, and amsgrad / lr_fn /
# lr_params collide with the same-named keys of generator_optimizer_params.
discriminator_optimizer_params:
  amsgrad: false
  lr_fn: PiecewiseConstantDecay
  lr_params:
    # 5 boundaries delimit 6 intervals, so `values` carries 6 entries
    # (one more than `boundaries`).
    boundaries:
      - 100000
      - 200000
      - 300000
      - 400000
      - 500000
    # Each value is half the previous one, except the final floor of 1.0e-06.
    values:
      - 0.00025
      - 0.000125
      - 6.25e-05
      - 3.125e-05
      - 1.5625e-05
      - 1.0e-06
# NOTE(review): 200000 also appears as the step in the `resume` checkpoint
# name (ckpt-200000) further down -- presumably deliberate; confirm.
discriminator_train_start_steps: 200000
eval_batch_size: 16
eval_interval_steps: 5000
format: npy
generator_mixed_precision: false
# Optimizer settings for the generator.
# The child keys must stay indented under this mapping: at column 0 they
# become top-level keys, this mapping parses as null, and amsgrad / lr_fn /
# lr_params collide with the same-named keys of discriminator_optimizer_params.
generator_optimizer_params:
  amsgrad: false
  lr_fn: PiecewiseConstantDecay
  lr_params:
    # 6 boundaries delimit 7 intervals, so `values` carries 7 entries
    # (one more than `boundaries`). Note the spacing is not uniform
    # (100k, 150k, then 400k onwards in 100k steps).
    boundaries:
      - 100000
      - 150000
      - 400000
      - 500000
      - 600000
      - 700000
    # Each value is half the previous one, except the final floor of 1.0e-06.
    values:
      - 0.0005
      - 0.00025
      - 0.000125
      - 6.25e-05
      - 3.125e-05
      - 1.5625e-05
      - 1.0e-06
# NOTE(review): a value of 1 presumably means no gradient accumulation --
# confirm against the trainer.
gradient_accumulation_steps: 1
# Hyper-parameters for the HiFi-GAN style discriminator.
# The child keys must stay indented under this mapping: at column 0, filters /
# is_weight_norm / kernel_size / out_channels / strides become top-level keys
# that collide with same-named keys of the other *_params sections.
hifigan_discriminator_params:
  filter_scales: 4
  filters: 8
  is_weight_norm: false
  kernel_size: 5
  max_filters: 512
  n_layers: 5
  out_channels: 1
  # Seven periods, all prime.
  period_scales:
    - 3
    - 5
    - 7
    - 11
    - 17
    - 23
    - 37
  strides: 3
# 512 = 8 * 4 * 4 * 4: the product of the generator's upsample_scales
# (8, 4, 4) and its out_channels (4).
# NOTE(review): presumably these must stay in sync -- confirm before editing.
hop_size: 512
is_shuffle: true
# NOTE(review): presumably weights for the adversarial and feature-matching
# loss terms -- confirm against the trainer.
lambda_adv: 2.5
lambda_feat_match: 10.0
log_interval_steps: 200
model_type: multiband_melgan_generator
# Hyper-parameters for the multi-band MelGAN discriminator.
# Two levels of nesting: downsample_pooling_params and
# nonlinear_activation_params are themselves mappings. Left at column 0 their
# children (pool_size, strides, alpha) and the sibling keys (filters,
# is_weight_norm, out_channels, ...) would all become colliding top-level keys.
multiband_melgan_discriminator_params:
  downsample_pooling: AveragePooling1D
  # NOTE(review): presumably passed as keyword arguments to the pooling layer
  # named above -- confirm against the model code.
  downsample_pooling_params:
    pool_size: 4
    strides: 2
  downsample_scales:
    - 4
    - 4
    - 4
  filters: 16
  is_weight_norm: false
  kernel_sizes:
    - 5
    - 3
  max_downsample_filters: 512
  nonlinear_activation: LeakyReLU
  # NOTE(review): presumably passed as keyword arguments to the activation
  # named above -- confirm against the model code.
  nonlinear_activation_params:
    alpha: 0.2
  out_channels: 1
  scales: 3
# Hyper-parameters for the multi-band MelGAN generator.
# The child keys must stay indented under this mapping: at column 0, filters /
# is_weight_norm / kernel_size / out_channels become top-level keys that
# collide with the same-named keys of the discriminator sections.
multiband_melgan_generator_params:
  filters: 384
  is_weight_norm: false
  kernel_size: 7
  out_channels: 4
  stack_kernel_size: 3
  stacks: 4
  # 8 * 4 * 4 = 128; multiplied by out_channels (4) this gives 512, which
  # equals the top-level hop_size.
  # NOTE(review): presumably these must stay in sync -- confirm before editing.
  upsample_scales:
    - 8
    - 4
    - 4
num_save_intermediate_results: 1
# outdir is also the parent directory of the `resume` checkpoint path below.
outdir: ./mb-melgan-hifi-sw-tz-victoria-ft-vocab-exp-synth-v2/
postnets: true
# Empty string.
# NOTE(review): presumably means "no pretrained weights to load" -- confirm.
pretrained: ''
remove_short_samples: true
# Checkpoint at step 200000, located under outdir.
resume: ./mb-melgan-hifi-sw-tz-victoria-ft-vocab-exp-synth-v2/checkpoints/ckpt-200000
sampling_rate: 44100
save_interval_steps: 20000
# Multi-resolution STFT loss settings: three resolutions, one per list index.
# The child keys must stay indented under this mapping: at column 0,
# fft_lengths / frame_lengths / frame_steps become top-level keys that collide
# with the same-named keys of subband_stft_loss_params.
stft_loss_params:
  fft_lengths:
    - 1024
    - 2048
    - 512
  frame_lengths:
    - 600
    - 1200
    - 240
  frame_steps:
    - 120
    - 240
    - 50
# Sub-band STFT loss settings: three resolutions, one per list index.
# The child keys must stay indented under this mapping: at column 0,
# fft_lengths / frame_lengths / frame_steps become top-level keys that collide
# with the same-named keys of stft_loss_params.
subband_stft_loss_params:
  fft_lengths:
    - 384
    - 683
    - 171
  frame_lengths:
    - 150
    - 300
    - 60
  frame_steps:
    - 30
    - 60
    - 10
train_dir: ./dump/train/
train_max_steps: 1000000
use_norm: true
verbose: 1
# Quoted so it stays the string '0.0' instead of being parsed as a float.
version: '0.0'
# End of configuration.