feat: initial public release v0.1.0 — MLX port of pyannote-speaker-diarization-3.1
Byte-parity with the pyannote PyTorch reference (cosine 0.763718, identical to 6 decimal places across 200 cross-window slot pairs). 2.5x faster than pyannote on MPS when running natively on Apple Silicon. Extracted from gitea.tavportal.com/olivier/MLX_CONVERTOR at commit 5f9eafa.
This commit is contained in:
28
tests/unit/test_diar_config.py
Normal file
28
tests/unit/test_diar_config.py
Normal file
@@ -0,0 +1,28 @@
|
||||
from pyannote_diarization_3_1_mlx._config import (
|
||||
SEG_DURATION, SEG_HOP, SEG_FRAMES, SEG_CLASSES,
|
||||
MAX_SPEAKERS_PER_CHUNK, MAX_SPEAKERS_PER_FRAME,
|
||||
EMB_BATCH_SIZE, EMB_EXCLUDE_OVERLAP,
|
||||
CLUSTER_METHOD, CLUSTER_THRESHOLD, CLUSTER_MIN_SIZE,
|
||||
SEG_HF_REPO, SEG_HF_REV, EMB_HF_REPO, EMB_HF_REV,
|
||||
)
|
||||
|
||||
|
||||
def test_pyannote_3_1_locked_hyperparameters():
    """Pin the imported hyperparameter constants to their expected literals.

    Each constant is compared against a hard-coded value so that any change
    to the configuration module fails this test. Checks run in a fixed
    order and stop at the first mismatch.
    """
    # (label, observed value, pinned value) — compared with ``==``.
    segmentation_and_batch = (
        ("SEG_DURATION", SEG_DURATION, 10.0),
        ("SEG_HOP", SEG_HOP, 1.0),
        ("SEG_FRAMES", SEG_FRAMES, 589),
        ("SEG_CLASSES", SEG_CLASSES, 7),
        ("MAX_SPEAKERS_PER_CHUNK", MAX_SPEAKERS_PER_CHUNK, 3),
        ("MAX_SPEAKERS_PER_FRAME", MAX_SPEAKERS_PER_FRAME, 2),
        ("EMB_BATCH_SIZE", EMB_BATCH_SIZE, 32),
    )
    for label, observed, pinned in segmentation_and_batch:
        assert observed == pinned, label

    # Identity, not equality: the flag must be the bool ``True`` itself,
    # so a merely truthy value such as ``1`` is rejected.
    assert EMB_EXCLUDE_OVERLAP is True

    clustering = (
        ("CLUSTER_METHOD", CLUSTER_METHOD, "centroid"),
        # Exact float comparison is deliberate: the value is a pinned literal.
        ("CLUSTER_THRESHOLD", CLUSTER_THRESHOLD, 0.7045654963945799),
        ("CLUSTER_MIN_SIZE", CLUSTER_MIN_SIZE, 12),
    )
    for label, observed, pinned in clustering:
        assert observed == pinned, label
|
||||
|
||||
|
||||
def test_locked_hf_revisions():
    """Pin the SEG_* and EMB_* repository names and revision hashes.

    Each imported constant must equal its hard-coded string exactly; checks
    run in a fixed order and stop at the first mismatch.
    """
    # (label, observed value, pinned value) — compared with ``==``.
    pinned_sources = (
        (
            "SEG_HF_REPO",
            SEG_HF_REPO,
            "mlx-community/pyannote-segmentation-3.0-mlx",
        ),
        (
            "SEG_HF_REV",
            SEG_HF_REV,
            "5189a69b35c5f7e48082a978f3476bac81590874",
        ),
        (
            "EMB_HF_REPO",
            EMB_HF_REPO,
            "mlx-community/wespeaker-voxceleb-resnet34-LM",
        ),
        (
            "EMB_HF_REV",
            EMB_HF_REV,
            "97fc9343d2cfd0ae4d1c1d8c299e0046aa502e31",
        ),
    )
    for label, observed, pinned in pinned_sources:
        assert observed == pinned, label
|
||||
Reference in New Issue
Block a user