# Diarization configuration: model definition, inference settings, and
# clustering settings.
# NOTE(review): each `args` table is presumably forwarded as keyword arguments
# to the corresponding component — confirm against the config loader.

[model]
# Dotted path naming the model class (presumably imported by the loader).
path = "diarizen.models.eend.model_wavlm_conformer.Model"

[model.args]
# WavLM front-end settings.
# NOTE(review): wavlm_layer_num and wavlm_feat_dim presumably have to agree
# with the checkpoint/config named by wavlm_src — confirm before changing any
# one of them in isolation.
wavlm_src = "wavlm_large_s80_md"
wavlm_layer_num = 25
wavlm_feat_dim = 1024
# Encoder hyperparameters (presumably for the Conformer blocks named in `path`).
attention_in = 256
ffn_hidden = 1024
num_head = 4
num_layer = 4
dropout = 0.1
chunk_size = 8  # unit not stated here — TODO confirm
use_posi = false
output_activate_function = false
selected_channel = 0
# Same value as min_speakers/max_speakers in [clustering.args].
max_speakers_per_chunk = 2

[inference.args]
seg_duration = 12  # presumably seconds — TODO confirm
segmentation_step = 0.1  # presumably a fraction of seg_duration — TODO confirm
batch_size = 32
apply_median_filtering = true

[clustering.args]
method = "AgglomerativeClustering"
# min_speakers and max_speakers are equal, so the allowed speaker-count range
# collapses to the single value 2.
min_speakers = 2
max_speakers = 2
# NOTE(review): the precision suggests this threshold came from an automated
# tuning run rather than being hand-picked — confirm before rounding.
ahc_threshold = 0.6647095879538272
min_cluster_size = 16