# Source: TTS_eval_models / speaker_similarity / pyannote / pyannote_diarization_config.yaml
# Hosting-page metadata: "Upload 6 files", revision fdc91b8 (verified, 4 months ago), 828 Bytes
#
# Speaker diarization pipeline configuration that points the embedding and
# segmentation models at local checkpoint files instead of Hugging Face model IDs.

version: 3.1.0

# Pipeline class to build and the arguments it is built with.
pipeline:
  name: pyannote.audio.pipelines.SpeakerDiarization
  params:
    clustering: AgglomerativeClustering

    # Embedding model.
    # To use the HF model instead of the local file:
    # embedding: pyannote/wespeaker-voxceleb-resnet34-LM
    # Local model.
    # NOTE(review): absolute path under one user's home directory; adjust it for your environment.
    embedding: /star-home/zhuhan/model/huggingface/pyannote/pyannote_model_wespeaker-voxceleb-resnet34-LM.bin
    embedding_batch_size: 32
    embedding_exclude_overlap: true

    # Segmentation model.
    # To use the HF model instead of the local file:
    # segmentation: pyannote/segmentation-3.0
    # Local model.
    # NOTE(review): absolute path under one user's home directory; adjust it for your environment.
    segmentation: /star-home/zhuhan/model/huggingface/pyannote/pyannote_model_segmentation-3.0.bin
    segmentation_batch_size: 32

# NOTE(review): presumably the tuned hyperparameters applied to the pipeline after
# it is constructed, grouped by sub-component; confirm against the pyannote.audio docs.
params:
  clustering:
    method: centroid
    min_cluster_size: 12
    threshold: 0.7045654963945799
  segmentation:
    min_duration_off: 0.0