Voice Activity Detection
Transformers
PyTorch
TensorBoard
Safetensors
pyannet
speaker-diarization
speaker-segmentation
Generated from Trainer
pyannote
pyannote.audio
pyannote-audio-model
audio
voice
speech
speaker
speaker-change-detection
overlapped-speech-detection
resegmentation
Inference Endpoints
{
  "architectures": [
    "SegmentationModel"
  ],
  "chunk_duration": 10.0,
  "max_speakers_per_chunk": 3,
  "max_speakers_per_frame": 2,
  "min_duration": null,
  "model_type": "pyannet",
  "sample_rate": 16000,
  "torch_dtype": "float32",
  "transformers_version": "4.40.0",
  "warm_up": [
    0.0,
    0.0
  ],
  "weigh_by_cardinality": false
}