diff --git a/speech_service/transcriber.py b/speech_service/transcriber.py index 8d873a1..a68266d 100644 --- a/speech_service/transcriber.py +++ b/speech_service/transcriber.py @@ -12,5 +12,5 @@ class WhisperTranscriber: print("Whisper model loaded.") def transcribe(self, audio_file: str) -> str: - result = self.pipe(audio_file, return_timestamps=True) + result = self.pipe(audio_file, batch_size=4, return_timestamps=True) return result.get("text", "").strip() diff --git a/telegram_bot/handlers/audio_handler.py b/telegram_bot/handlers/audio_handler.py index c25e205..b883e59 100644 --- a/telegram_bot/handlers/audio_handler.py +++ b/telegram_bot/handlers/audio_handler.py @@ -50,6 +50,7 @@ async def handle_voice_and_video(message: types.Message, redis_service, storage_ chat_id=message.chat.id, message_id=message.message_id ) + os.remove(wav_destination) if text: await send_long_message(message, text) else: