Files
pyannote-speaker-diarizatio…/tests/unit/test_diar_config.py
transcrilive 2b1a3c1312 feat: initial public release v0.1.0 — MLX port of pyannote-speaker-diarization-3.1
Byte-parity with pyannote-PyTorch reference (cosine 0.763718 identical
at 6 decimals on 200 cross-window slot pairs). 2.5x faster than
pyannote-MPS on Apple Silicon native.

Extracted from gitea.tavportal.com/olivier/MLX_CONVERTOR commit 5f9eafa.
2026-05-09 16:05:39 +02:00

29 lines
1.0 KiB
Python

from pyannote_diarization_3_1_mlx._config import (
SEG_DURATION, SEG_HOP, SEG_FRAMES, SEG_CLASSES,
MAX_SPEAKERS_PER_CHUNK, MAX_SPEAKERS_PER_FRAME,
EMB_BATCH_SIZE, EMB_EXCLUDE_OVERLAP,
CLUSTER_METHOD, CLUSTER_THRESHOLD, CLUSTER_MIN_SIZE,
SEG_HF_REPO, SEG_HF_REV, EMB_HF_REPO, EMB_HF_REV,
)
def test_pyannote_3_1_locked_hyperparameters() -> None:
    """Pin the hyperparameter constants exported by ``_config``.

    Each assertion compares one imported constant against a hard-coded
    literal, so any edit to these values in ``_config`` fails this test.
    """
    # SEG_* constants.
    assert SEG_DURATION == 10.0
    assert SEG_HOP == 1.0
    assert SEG_FRAMES == 589
    assert SEG_CLASSES == 7

    # Per-chunk / per-frame speaker caps.
    assert MAX_SPEAKERS_PER_CHUNK == 3
    assert MAX_SPEAKERS_PER_FRAME == 2

    # EMB_* constants. The identity check requires the bool singleton
    # ``True``; a merely truthy value such as 1 does not pass.
    assert EMB_BATCH_SIZE == 32
    assert EMB_EXCLUDE_OVERLAP is True

    # CLUSTER_* constants. The threshold is compared with exact float
    # equality (no tolerance).
    assert CLUSTER_METHOD == "centroid"
    assert CLUSTER_THRESHOLD == 0.7045654963945799
    assert CLUSTER_MIN_SIZE == 12
def test_locked_hf_revisions() -> None:
    """Pin the ``*_HF_REPO`` / ``*_HF_REV`` constants exported by ``_config``.

    Each repo id and revision string is compared against a hard-coded
    literal, so changing any of them in ``_config`` fails this test.
    """
    # SEG_* repo id and revision.
    assert SEG_HF_REPO == "mlx-community/pyannote-segmentation-3.0-mlx"
    assert SEG_HF_REV == "5189a69b35c5f7e48082a978f3476bac81590874"

    # EMB_* repo id and revision.
    assert EMB_HF_REPO == "mlx-community/wespeaker-voxceleb-resnet34-LM"
    assert EMB_HF_REV == "97fc9343d2cfd0ae4d1c1d8c299e0046aa502e31"