Spaces:

AlserFurma
/

LipSyncAI

Sleeping

AlserFurma committed on Oct 20, 2025

Commit

2773547

verified ·

1 Parent(s): 0ff6411

Create app.py

Files changed (1) hide show

app.py ADDED Viewed

+import gradio as gr
+import os
+from gtts import gTTS
+import subprocess
+import tempfile
def _write_png(path, pixels):
    """Write an image array to ``path`` as an 8-bit PNG using only the stdlib.

    Args:
        path: Destination file path.
        pixels: Array-like object exposing ``ndim``, ``shape``, ``astype`` and
            ``tobytes`` (e.g. a NumPy array) shaped ``(H, W)`` or ``(H, W, C)``
            with ``C`` between 1 and 4. Values are cast to ``uint8``
            (assumes they are already in the 0-255 range - TODO confirm
            against the UI component's output).

    Raises:
        ValueError: If the array does not have a supported shape.
    """
    import struct
    import zlib

    if pixels.ndim == 2:
        # Treat a plain 2-D array as a single-channel (grayscale) image.
        pixels = pixels[:, :, None]
    if pixels.ndim != 3 or pixels.shape[2] not in (1, 2, 3, 4):
        raise ValueError(f"unsupported image shape: {pixels.shape!r}")

    height, width, channels = pixels.shape
    # PNG colour types: 0 = gray, 4 = gray+alpha, 2 = RGB, 6 = RGBA.
    colour_type = {1: 0, 2: 4, 3: 2, 4: 6}[channels]
    rows = pixels.astype("uint8")
    # Every scanline is prefixed with filter type 0 ("None").
    scanlines = b"".join(b"\x00" + rows[y].tobytes() for y in range(height))

    def chunk(tag, payload):
        checksum = zlib.crc32(tag + payload) & 0xFFFFFFFF
        return (
            struct.pack(">I", len(payload))
            + tag
            + payload
            + struct.pack(">I", checksum)
        )

    header = struct.pack(">IIBBBBB", width, height, 8, colour_type, 0, 0, 0)
    with open(path, "wb") as out:
        out.write(b"\x89PNG\r\n\x1a\n")
        out.write(chunk(b"IHDR", header))
        out.write(chunk(b"IDAT", zlib.compress(scanlines)))
        out.write(chunk(b"IEND", b""))


def _resolve_face_path(image, work_dir):
    """Return a file path for ``image``, saving it into ``work_dir`` if needed."""
    if isinstance(image, (str, os.PathLike)):
        return os.fspath(image)
    face_path = os.path.join(work_dir, "face.png")
    if hasattr(image, "save"):
        # PIL-style image objects know how to write themselves to disk.
        image.save(face_path)
    else:
        _write_png(face_path, image)
    return face_path


def generate_video(image, text):
    """Create a lip-synced video of ``image`` speaking ``text``.

    The text is synthesised to speech with gTTS, then the Wav2Lip inference
    script is run as a subprocess on the face image and the generated audio.

    Args:
        image: The face picture. May be a file path, an object with a
            ``save(path)`` method, or an image array; anything that is not
            already a path is written to a temporary PNG first.
        text: The text to be spoken.

    Returns:
        A ``(status_message, video_path)`` tuple. ``video_path`` is ``None``
        when the inputs are missing.

    Raises:
        subprocess.CalledProcessError: If the Wav2Lip script exits with a
            non-zero status.
    """
    import shutil

    # ``text`` may be None as well as empty/whitespace-only.
    if image is None or not text or not text.strip():
        return "Ошибка: Загрузите фото и введите текст.", None

    # 1. Create the temporary working files.
    temp_dir = tempfile.mkdtemp()
    # gTTS produces MP3 data, so give the file a matching extension rather
    # than mislabelling it as WAV.
    audio_path = os.path.join(temp_dir, "speech.mp3")
    video_path = os.path.join(temp_dir, "result.mp4")

    try:
        face_path = _resolve_face_path(image, temp_dir)

        # 2. Generate the voice track from the text (TTS).
        tts = gTTS(text, lang='en')
        tts.save(audio_path)

        # 3. Run Wav2Lip. An argument list without a shell keeps paths with
        #    quotes or spaces from being misparsed or executed.
        command = [
            "python", "Wav2Lip/inference.py",
            "--checkpoint_path", "wav2lip_gan.pth",
            "--face", face_path,
            "--audio", audio_path,
            "--outfile", video_path,
        ]
        subprocess.run(command, check=True)
    except Exception:
        # Nothing usable was produced; do not leak the temp directory.
        shutil.rmtree(temp_dir, ignore_errors=True)
        raise

    # The directory is intentionally kept on success: the returned video
    # lives inside it.
    return "Видео готово!", video_path
# Build the web UI: a photo and a text box go in, a status line and the
# generated video come out.
iface = gr.Interface(
    fn=generate_video,
    inputs=[
        # generate_video forwards the image to Wav2Lip's --face option, which
        # takes a file path, so ask Gradio for a path instead of pixel data.
        gr.Image(label="Фото человека", type="filepath"),
        gr.Textbox(label="Введите текст речи")
    ],
    outputs=[
        gr.Text(label="Статус"),
        gr.Video(label="Результат")
    ],
    title="AI LipSync Generator",
    description="Загрузи фото и введи текст — программа создаст видео, где человек говорит этот текст."
)
# Start the Gradio server when the module is executed.
iface.launch()