74 lines
2.5 KiB
Python
74 lines
2.5 KiB
Python
import os
|
||
import subprocess
|
||
import uuid
|
||
from functools import partial
|
||
from aiogram import types, Dispatcher, F
|
||
|
||
async def handle_voice_and_video(message: types.Message, redis_service, storage_path: str):
|
||
file_id = None
|
||
if message.content_type == types.ContentType.VOICE:
|
||
file_id = message.voice.file_id
|
||
elif message.content_type == types.ContentType.VIDEO_NOTE:
|
||
file_id = message.video_note.file_id
|
||
|
||
if not file_id:
|
||
return
|
||
|
||
file = await message.bot.get_file(file_id)
|
||
file_path = file.file_path
|
||
|
||
file_uuid = str(uuid.uuid4())
|
||
original_filename = os.path.basename(file_path)
|
||
temp_filename = f"{file_uuid}_{original_filename}"
|
||
|
||
os.makedirs(storage_path, exist_ok=True)
|
||
|
||
temp_destination = os.path.join(storage_path, temp_filename)
|
||
|
||
await message.bot.download_file(file_path, temp_destination)
|
||
|
||
wav_filename = f"{file_uuid}.wav"
|
||
wav_destination = os.path.join(storage_path, wav_filename)
|
||
|
||
convert_to_wav(temp_destination, wav_destination)
|
||
|
||
os.remove(temp_destination)
|
||
|
||
task_data = {
|
||
"uuid": file_uuid,
|
||
"file_path": wav_destination,
|
||
"user_id": message.from_user.id,
|
||
"chat_id": message.chat.id,
|
||
"message_id": message.message_id
|
||
}
|
||
|
||
await redis_service.publish_task(task_data)
|
||
await message.reply("Your message has been received, converted to WAV, and queued for processing.\nWaiting for transcription...")
|
||
|
||
text = await redis_service.wait_for_text(
|
||
user_id=message.from_user.id,
|
||
chat_id=message.chat.id,
|
||
message_id=message.message_id
|
||
)
|
||
if text:
|
||
await message.reply(f"Transcription result:\n{text}")
|
||
else:
|
||
await message.reply("Sorry, transcription result was not received within the timeout.")
|
||
|
||
|
||
def convert_to_wav(input_file: str, output_file: str):
|
||
"""
|
||
Конвертирует любой аудиофайл в WAV с частотой 16kHz, 1 канал (моно).
|
||
Логирует ошибки FFmpeg.
|
||
"""
|
||
command = [
|
||
"ffmpeg", "-y", "-i", input_file,
|
||
"-ar", "16000", "-ac", "1", "-c:a", "pcm_s16le",
|
||
output_file
|
||
]
|
||
subprocess.run(command, stdout=subprocess.PIPE, stderr=subprocess.PIPE)
|
||
|
||
def register_audio_handlers(dp: Dispatcher, redis_service, storage_path: str):
|
||
handler_callback = partial(handle_voice_and_video, redis_service=redis_service, storage_path=storage_path)
|
||
dp.message.register(handler_callback, F.content_type.in_({types.ContentType.VOICE, types.ContentType.VIDEO_NOTE}))
|