hicustomer
/

pyannote-speaker-diarization

Automatic Speech Recognition

pyannote-audio-pipeline

speaker-diarization

speaker-change-detection

voice-activity-detection

overlapped-speech-detection

Model card | Files and versions

Hervé BREDIN committed on Oct 24, 2022

Commit

369ac18

·

1 Parent(s): 89e7168

feat: prepare for pyannote.audio 2.1

Files changed (1) hide show

config.yaml +10 -12

config.yaml CHANGED Viewed

@@ -1,20 +1,18 @@
 pipeline:
   name: pyannote.audio.pipelines.SpeakerDiarization
   params:
-    segmentation: pyannote/segmentation@2022.07
-    segmentation_step: 0.1
-    segmentation_batch_size: 32
-    # embedding: speechbrain/spkrec-ecapa-voxceleb@5c0be3875fda05e81f3c004ed8c7c06be308de1e
     embedding: speechbrain/spkrec-ecapa-voxceleb
-    embedding_exclude_overlap: True
     embedding_batch_size: 32
-    clustering: HiddenMarkovModelClustering
 params:
-  segmentation_onset: 0.58
   clustering:
-    covariance_type: diag
-    threshold: 0.35
-    single_cluster_detection:
-      quantile: 0.05
-      threshold: 1.15

 pipeline:
   name: pyannote.audio.pipelines.SpeakerDiarization
   params:
+    clustering: AgglomerativeClustering
     embedding: speechbrain/spkrec-ecapa-voxceleb
     embedding_batch_size: 32
+    embedding_exclude_overlap: true
+    segmentation: pyannote/segmentation@2022.07
+    segmentation_batch_size: 32
 params:
   clustering:
+    method: centroid
+    min_cluster_size: 15
+    threshold: 0.7153814381597874
+  segmentation:
+    min_duration_off: 0.5817029604921046
+    threshold: 0.4442333667381752