From ac7596c1836970684b826d6d7cbcc94459cfb299 Mon Sep 17 00:00:00 2001
From: itqop
Date: Sun, 23 Feb 2025 23:13:04 +0300
Subject: [PATCH] small fixes

---
 speech_service/transcriber.py          | 2 +-
 telegram_bot/handlers/audio_handler.py | 1 +
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/speech_service/transcriber.py b/speech_service/transcriber.py
index 8d873a1..a68266d 100644
--- a/speech_service/transcriber.py
+++ b/speech_service/transcriber.py
@@ -12,5 +12,5 @@ class WhisperTranscriber:
         print("Whisper model loaded.")
 
     def transcribe(self, audio_file: str) -> str:
-        result = self.pipe(audio_file, return_timestamps=True)
+        result = self.pipe(audio_file, batch_size=4, return_timestamps=True)
         return result.get("text", "").strip()
diff --git a/telegram_bot/handlers/audio_handler.py b/telegram_bot/handlers/audio_handler.py
index c25e205..b883e59 100644
--- a/telegram_bot/handlers/audio_handler.py
+++ b/telegram_bot/handlers/audio_handler.py
@@ -50,6 +50,7 @@ async def handle_voice_and_video(message: types.Message, redis_service, storage_
                 chat_id=message.chat.id,
                 message_id=message.message_id
             )
+            os.remove(wav_destination)
             if text:
                 await send_long_message(message, text)
             else: