fixes bugs

2026-02-19 04:11:36 +03:00 · 2026-02-19 04:11:36 +03:00 · eb08c1fef9
parent de07a045ce
commit eb08c1fef9
3 changed files with 4 additions and 6 deletions
--- a/README.md
+++ b/README.md
@ -5,7 +5,7 @@
 ## Возможности

 - Распознавание речи (faster-whisper, модель large-v3)
- Диаризация спикеров (pyannote.audio 3.1)
+- Диаризация спикеров (pyannote.audio community-1)
 - Поддержка форматов: `.m4a`, `.mp3`, `.wav`, `.aac`
 - Аудио до 3 часов / 2 ГБ
 - Автоматический чанкинг для длинных записей (>30 мин)
@ -38,8 +38,7 @@ HF_TOKEN=hf_your_token_here

 > Для получения токена: https://huggingface.co/settings/tokens
 > Необходимо принять условия использования моделей:
-> - https://huggingface.co/pyannote/speaker-diarization-3.1
-> - https://huggingface.co/pyannote/segmentation-3.0
+> - https://huggingface.co/pyannote/speaker-diarization-community-1

 ## Использование

--- a/requirements.txt
+++ b/requirements.txt
@ -1,5 +1,4 @@
 faster-whisper
 pyannote.audio
 python-dotenv
-pydub
 tqdm
--- a/transcriber/diarization/pyannote_engine.py
+++ b/transcriber/diarization/pyannote_engine.py
@ -23,7 +23,7 @@ class DiarizationEngine:
    def __init__(self, hf_token: str, device: str):
        logger.info("Loading diarization pipeline on %s", device)
        self._pipeline = Pipeline.from_pretrained(
-            "pyannote/speaker-diarization-3.1",
+            "pyannote/speaker-diarization-community-1",
            token=hf_token,
        )
        self._device = torch.device(device)
@ -57,7 +57,7 @@ class DiarizationEngine:
            diarization = self._pipeline(audio_path, hook=hook, **kwargs)

        turns = []
-        for turn, _, speaker in diarization.itertracks(yield_label=True):
+        for turn, speaker in diarization.exclusive_speaker_diarization:
            turns.append(SpeakerTurn(
                start=turn.start,
                end=turn.end,