# Dotted import path of the model class used by this configuration.
[model]
path = "diarizen.models.eend.model_wavlm_conformer.Model"

# Arguments for the class named by `model.path`.
# NOTE(review): presumably forwarded as constructor keyword arguments —
# confirm against the code that loads this file.
[model.args]
wavlm_src = "wavlm_large_s80_md"
wavlm_layer_num = 25
wavlm_feat_dim = 1024
attention_in = 256
ffn_hidden = 1024
num_head = 4
num_layer = 4
dropout = 0.1
chunk_size = 8
use_posi = false
output_activate_function = false
selected_channel = 0
max_speakers_per_chunk = 2

# Inference-time settings.
# NOTE(review): `seg_duration` is presumably in seconds and
# `segmentation_step` a fraction of that duration — confirm with the consumer.
[inference.args]
seg_duration = 12
segmentation_step = 0.1
batch_size = 32
apply_median_filtering = true

# Clustering settings. `min_speakers` and `max_speakers` are both 2, so the
# permitted speaker-count range is a single value.
# NOTE(review): `ahc_threshold` looks like a tuned value — confirm its origin
# before rounding or editing it.
[clustering.args]
method = "AgglomerativeClustering"
min_speakers = 2
max_speakers = 2
ahc_threshold = 0.6647095879538272
min_cluster_size = 16
|