BUT-FIT
/

diarizen-wavlm-large-s80-mlc

Voice Activity Detection

speaker-diarization

pyannote-audio-pipeline

Model card | Files and versions

Jyhan003 committed on May 6

Commit

c77de77

·

1 Parent(s): 0ff0255

initial commit

Files changed (2) hide show

config.toml +30 -0
pytorch_model.bin +3 -0

config.toml ADDED Viewed

	@@ -0,0 +1,30 @@

+[model]
+path = "diarizen.models.eend.model_wavlm_conformer.Model"
+[model.args]
+wavlm_src = "wavlm_large_s80_md"
+wavlm_layer_num = 25
+wavlm_feat_dim = 1024
+attention_in = 256
+ffn_hidden = 1024
+num_head = 4
+num_layer = 4
+dropout = 0.1
+chunk_size = 8
+use_posi = false
+output_activate_function = false
+selected_channel = 0
+[inference.args]
+seg_duration = 8
+segmentation_step = 0.1
+batch_size = 32
+apply_median_filtering = true
+[clustering.args]
+method = "AgglomerativeClustering"
+min_speakers = 2
+max_speakers = 2
+ahc_threshold = 0.6647095879538272
+min_cluster_size = 16
+min_frames_ratio = 0.1

pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9117101fefd61c74201edac55a47418f9137d6381fcc327db9cb9b780551a93d
+size 278059174