Text-to-Speech
English
Chinese
TTS_eval_models/speaker_similarity/pyannote/pyannote_diarization_config.yaml
zhu-han's picture
Upload 6 files
fdc91b8 verified
raw
history blame
828 Bytes
# Speaker-diarization pipeline configuration.
# NOTE(review): the nesting below follows the pyannote.audio pipeline config
# layout (a `pipeline` section plus a separate top-level `params` section);
# confirm against the loader that consumes this file.

# Quoted so the value stays a string even if it is ever shortened to a
# two-part version such as 3.1, which YAML would read as a float.
version: "3.1.0"

pipeline:
  name: pyannote.audio.pipelines.SpeakerDiarization
  # Presumably the arguments handed to the pipeline class named above when it
  # is constructed; verify against the loader.
  params:
    clustering: AgglomerativeClustering

    # To use the Hugging Face model instead of a local file:
    # embedding: pyannote/wespeaker-voxceleb-resnet34-LM
    # Local model file. This is an absolute, machine-specific path and must be
    # adjusted on any other host.
    embedding: /star-home/zhuhan/model/huggingface/pyannote/pyannote_model_wespeaker-voxceleb-resnet34-LM.bin
    embedding_batch_size: 32
    embedding_exclude_overlap: true

    # To use the Hugging Face model instead of a local file:
    # segmentation: pyannote/segmentation-3.0
    # Local model file. This is an absolute, machine-specific path and must be
    # adjusted on any other host.
    segmentation: /star-home/zhuhan/model/huggingface/pyannote/pyannote_model_segmentation-3.0.bin
    segmentation_batch_size: 32

# Top-level section, distinct from `pipeline.params` above: values are grouped
# under the `clustering` and `segmentation` component names.
params:
  clustering:
    method: centroid
    min_cluster_size: 12
    threshold: 0.7045654963945799
  segmentation:
    min_duration_off: 0.0