BUT-FIT
/

diarizen-wavlm-large-s80-mlc

Voice Activity Detection

speaker-diarization

pyannote-audio-pipeline

Model card Files Files and versions

diarizen-wavlm-large-s80-mlc / config.toml

Jyhan003's picture

Remove redundant part

5276400 7 months ago

history blame contribute delete

605 Bytes

	# Selects the model implementation, given as a dotted path ending in `Model`.
	# NOTE(review): presumably resolved by the loader as a Python import path
	# (module `diarizen.models.eend.model_wavlm_conformer`, class `Model`) — confirm.
	[model]
	path = "diarizen.models.eend.model_wavlm_conformer.Model"

	# Arguments for the model selected in [model].
	# NOTE(review): presumably passed as keyword arguments to the model
	# constructor; these must match the trained checkpoint, so do not edit
	# them independently of the weights — confirm against the loader.
	[model.args]
	# WavLM front-end settings. NOTE(review): 25 layers / 1024 dims looks like
	# WavLM Large (24 transformer layers plus the input embedding) — confirm.
	wavlm_src = "wavlm_large_s80_md"
	wavlm_layer_num = 25
	wavlm_feat_dim = 1024
	# Back-end sizes; by the module name in [model] these presumably configure
	# the Conformer (attention width, feed-forward width, heads, layers) — confirm.
	attention_in = 256
	ffn_hidden = 1024
	num_head = 4
	num_layer = 4
	dropout = 0.1
	# NOTE(review): unit not shown here (presumably seconds). This value (8)
	# differs from `seg_duration = 12` under [inference.args]; verify that the
	# mismatch is intentional.
	chunk_size = 8
	# NOTE(review): presumably toggles positional encoding — confirm.
	use_posi = false
	# NOTE(review): a boolean here (rather than an activation name) presumably
	# means "no output activation" — confirm.
	output_activate_function = false
	# NOTE(review): presumably the index of the input audio channel to use.
	selected_channel = 0
	max_speakers_per_chunk = 2

	# Inference-time settings for the diarization pipeline.
	[inference.args]
	# NOTE(review): unit not shown here (presumably seconds per segmentation
	# window). `chunk_size` under [model.args] is 8; verify the two are meant
	# to differ.
	seg_duration = 12
	# NOTE(review): in pyannote-style pipelines this is a ratio of the window
	# duration (0.1 would mean 90% overlap between windows) — confirm.
	segmentation_step = 0.1
	batch_size = 32
	apply_median_filtering = true

	# Speaker-clustering settings.
	[clustering.args]
	method = "AgglomerativeClustering"
	# NOTE(review): min and max are both 2, which (if the pipeline honours
	# these bounds) pins the output to exactly two speakers. Confirm this is
	# intended before using the config on recordings with other speaker counts.
	min_speakers = 2
	max_speakers = 2
	# NOTE(review): the full-precision value looks like the output of an
	# automated tuning run; presumably the stopping threshold for agglomerative
	# clustering — confirm before rounding or changing it.
	ahc_threshold = 0.6647095879538272
	min_cluster_size = 16