patriotyk committed on
Commit
0123370
·
verified ·
1 Parent(s): e0ee43b

Replace wrong model

Browse files
Files changed (2)
  1. config.yml +8 -6
  2. pytorch_model.bin +2 -2
config.yml CHANGED
@@ -1,5 +1,5 @@
1
 
2
- multispeaker: true
3
 
4
  dim_in: 64
5
  hidden_dim: 512
@@ -15,16 +15,18 @@ dropout: 0.2
15
 
16
  # config for decoder
17
  decoder:
18
- type: 'hifigan' # either hifigan or istftnet
19
  resblock_kernel_sizes: [3,7,11]
20
- upsample_rates : [10,5,3,2]
21
  upsample_initial_channel: 512
22
  resblock_dilation_sizes: [[1,3,5], [1,3,5], [1,3,5]]
23
- upsample_kernel_sizes: [20,10,6,4]
 
 
24
 
25
  # speech language model config
26
  slm:
27
- model: ''
28
  sr: 16000 # sampling rate of SLM
29
  hidden: 768 # hidden size of SLM
30
  nlayers: 13 # number of layers of SLM
@@ -42,7 +44,7 @@ diffusion:
42
 
43
  # diffusion distribution config
44
  dist:
45
- sigma_data: 0.19988229232390187 # placeholder for estimate_sigma_data set to false
46
  estimate_sigma_data: true # estimate sigma_data from the current batch if set to true
47
  mean: -3.0
48
  std: 1.0
 
1
 
2
+ multispeaker: false
3
 
4
  dim_in: 64
5
  hidden_dim: 512
 
15
 
16
  # config for decoder
17
  decoder:
18
+ type: 'istftnet' # either hifigan or istftnet
19
  resblock_kernel_sizes: [3,7,11]
20
+ upsample_rates : [10, 6]
21
  upsample_initial_channel: 512
22
  resblock_dilation_sizes: [[1,3,5], [1,3,5], [1,3,5]]
23
+ upsample_kernel_sizes: [20, 12]
24
+ gen_istft_n_fft: 20
25
+ gen_istft_hop_size: 5
26
 
27
  # speech language model config
28
  slm:
29
+ model: 'openai/whisper-medium'
30
  sr: 16000 # sampling rate of SLM
31
  hidden: 768 # hidden size of SLM
32
  nlayers: 13 # number of layers of SLM
 
44
 
45
  # diffusion distribution config
46
  dist:
47
+ sigma_data: 0.18 # placeholder for estimate_sigma_data set to false
48
  estimate_sigma_data: true # estimate sigma_data from the current batch if set to true
49
  mean: -3.0
50
  std: 1.0
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bfd0e06ecc528d25c5d6371c0a5dbfa742b008d0f83d843738e411efeb03f851
3
- size 766654558
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25e78d882ec4ee5a8a361749004edf6914137760f2be33a71ea24ce22da1a24a
3
+ size 748848243