Spaces:

AlserFurma
/

LipSyncAI

Sleeping

App Files Files Community

AlserFurma committed on Dec 1, 2025

Commit

670074b

verified ·

1 Parent(s): 94b627a

Update app.py

Browse files

Files changed (1) hide show

app.py +238 -252

app.py CHANGED Viewed

@@ -4,96 +4,78 @@ from PIL import Image
 import tempfile
 from gradio_client import Client, handle_file
 import torch
-from transformers import VitsModel, AutoTokenizer, pipeline, T5Tokenizer, T5ForConditionalGeneration
 import scipy.io.wavfile as wavfile
 import traceback
 import base64
-import nltk
 import random
-# Инициализация NLTK
-try:
-    nltk.data.find('tokenizers/punkt')
-except LookupError:
-    nltk.download('punkt', quiet=True)
-from nltk.tokenize import sent_tokenize
-# Глобальные переменные для моделей
-device = "cuda" if torch.cuda.is_available() else "cpu"
-print(f"Using device: {device}")
 tts_model = None
 tts_tokenizer = None
-translator = None
-qg_tokenizer = None
-qg_model = None
-qa_pipeline = None
 TALKING_HEAD_SPACE = "Skywork/skyreels-a1-talking-head"
-def load_models():
-    """Ленивая загрузка моделей при первом использовании"""
-    global tts_model, tts_tokenizer, translator, qg_tokenizer, qg_model, qa_pipeline
-    try:
-        if tts_model is None:
-            print("Загрузка TTS модели...")
-            tts_model = VitsModel.from_pretrained("facebook/mms-tts-kaz").to(device)
-            tts_tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-kaz")
-            print("✓ TTS модель загружена")
-        if translator is None:
-            print("Загрузка модели перевода (это может занять минуту)...")
-            # Используем более легкую модель
-            translator = pipeline(
-                "translation",
-                model="Helsinki-NLP/opus-mt-ru-en",  # Только ru->en
-                device=device
-            )
-            print("✓ Модель перевода загружена")
-        return True
-    except Exception as e:
-        print(f"Ошибка загрузки базовых моделей: {str(e)}")
-        traceback.print_exc()
-        return False
-def load_qa_models():
-    """Загрузка моделей для интерактивного урока"""
-    global qg_tokenizer, qg_model, qa_pipeline
-    try:
-        if qg_tokenizer is None:
-            print("Загрузка QG модели...")
-            qg_tokenizer = T5Tokenizer.from_pretrained("iarfmoose/t5-base-question-generator", legacy=False)
-            qg_model = T5ForConditionalGeneration.from_pretrained("iarfmoose/t5-base-question-generator").to(device)
-            print("✓ QG модель загружена")
-        if qa_pipeline is None:
-            print("Загрузка QA модели...")
-            qa_pipeline = pipeline("question-answering", model="deepset/roberta-base-squad2", device=device)
-            print("✓ QA модель загружена")
-        return True
-    except Exception as e:
-        print(f"Ошибка загрузки QA моделей: {str(e)}")
-        traceback.print_exc()
-        return False
-def translate_ru_to_kk(text):
-    """Упрощенный перевод через английский"""
-    try:
-        # ru -> en
-        en_result = translator(text, max_length=512)[0]['translation_text']
-        # Простая транслитерация для казахского (заглушка)
-        # В реальности нужна модель en->kk, но для демо используем транслит
-        kk_text = en_result  # Временно оставляем на английском
-        return kk_text
-    except Exception as e:
-        print(f"Ошибка перевода: {e}")
-        return text  # Возвращаем исходный текст
 def inference(image: Image.Image, text: str):
     error_msg = ""
@@ -102,37 +84,45 @@ def inference(image: Image.Image, text: str):
     img_path = None
     try:
-        # Загрузка моделей при первом запуске
-        if not load_models():
-            raise RuntimeError("Не удалось загрузить модели")
         # Валидация
         if image is None:
             raise ValueError("Загрузите изображение лектора!")
         if not text or not text.strip():
-            raise ValueError("Введите текст лекции на русском!")
         if len(text) > 500:
-            raise ValueError("Текст слишком длинный! Используйте до 500 символов.")
-        print(f"Входной текст (ru): '{text[:50]}...'")
-        # Перевод на казахский
-        translated_text = translate_ru_to_kk(text)
         print(f"Переведенный текст: '{translated_text[:50]}...'")
-        # Генерация аудио
-        torch.manual_seed(42)
-        inputs = tts_tokenizer(translated_text, return_tensors="pt").to(device)
         with torch.no_grad():
             output = tts_model(**inputs)
             waveform = output.waveform.squeeze().cpu().numpy()
         if waveform.size == 0:
             raise ValueError("TTS сгенерировал пустое аудио!")
         audio = (waveform * 32767).astype("int16")
         sampling_rate = tts_model.config.sampling_rate
@@ -140,26 +130,36 @@ def inference(image: Image.Image, text: str):
             wavfile.write(audio_file.name, sampling_rate, audio)
             audio_path = audio_file.name
-        print(f"Аудио сохранено: {audio_path}")
-        # Сохранение изображения
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as img_file:
-            if image.mode != 'RGB':
-                image = image.convert('RGB')
-            image.save(img_file.name, format='PNG')
             img_path = img_file.name
-        print(f"Изображение сохранено: {img_path}")
-        # Вызов talking-head API
         print(f"Подключение к {TALKING_HEAD_SPACE}...")
-        client = Client(TALKING_HEAD_SPACE)
         result = client.predict(
             image_path=handle_file(img_path),
             audio_path=handle_file(audio_path),
-            guidance_scale=3.0,
-            steps=10,
             api_name="/process_image_audio"
         )
@@ -180,15 +180,16 @@ def inference(image: Image.Image, text: str):
         if not video_path or not os.path.exists(video_path):
             raise ValueError("Видео не сгенерировано!")
-        print(f"Видео сгенерировано: {video_path}")
         error_msg = "✅ Бейне сәтті жасалды!"
     except Exception as e:
-        error_msg = f"❌ Ошибка: {str(e)}"
         print(f"ОШИБКА: {error_msg}")
         traceback.print_exc()
     finally:
         for path in [audio_path, img_path]:
             if path and os.path.exists(path):
                 try:
@@ -199,204 +200,185 @@ def inference(image: Image.Image, text: str):
     return video_path, error_msg
 def generate_interactive_lesson(text, video_path):
     try:
-        # Загрузка QA моделей
-        if not load_qa_models():
-            return "<p style='color: red;'>❌ Не удалось загрузить модели для генерации вопросов</p>"
         if not video_path or not os.path.exists(video_path):
-            return "<p style='color: red;'>❌ Сначала сгенерируйте видео!</p>"
-        # Перевод на английский
-        english_text = translator(text, max_length=512)[0]['translation_text']
-        print(f"English text: {english_text[:100]}...")
-        # Генерация вопросов
-        sentences = sent_tokenize(english_text)[:3]
         questions = []
         for i, sent in enumerate(sentences):
             if len(sent) < 10:
                 continue
-            try:
-                # Генерация вопроса
-                qg_input = f"generate question: {sent}"
-                input_ids = qg_tokenizer.encode(qg_input, return_tensors="pt", max_length=512, truncation=True).to(device)
-                with torch.no_grad():
-                    outputs = qg_model.generate(input_ids, max_length=64, num_beams=4)
-                question_en = qg_tokenizer.decode(outputs[0], skip_special_tokens=True)
-                if not question_en or len(question_en) < 5:
-                    question_en = f"What is mentioned about {sent.split()[0]}?"
-                print(f"Q{i+1}: {question_en}")
-                # Извлечение ответа
-                try:
-                    qa_result = qa_pipeline(question=question_en, context=english_text)
-                    correct_answer_en = qa_result['answer']
-                except:
-                    correct_answer_en = sent.split()[0:5]
-                    correct_answer_en = " ".join(correct_answer_en)
-                # Неправильный ответ
-                wrong_options = ["Not mentioned", "Unknown", "Incorrect answer"]
-                wrong_answer_en = random.choice(wrong_options)
-                questions.append({
-                    "question": question_en,
-                    "correct": correct_answer_en,
-                    "wrong": wrong_answer_en
-                })
-            except Exception as e:
-                print(f"Ошибка генерации вопроса {i+1}: {e}")
                 continue
         if not questions:
-            return "<p style='color: orange;'>⚠️ Не удалось сгенерировать вопросы. Текст слишком короткий?</p>"
-        # Base64 видео
         with open(video_path, 'rb') as f:
-            video_base64 = base64.b64encode(f.read()).decode('utf-8')
-        # HTML
         html = f"""<!DOCTYPE html>
-        <html>
-        <head>
-            <meta charset="UTF-8">
-            <title>Interactive Lesson</title>
-            <style>
-                body {{ font-family: Arial, sans-serif; max-width: 900px; margin: 20px auto; padding: 20px; background: #f0f0f0; }}
-                h1 {{ color: #2c3e50; text-align: center; }}
-                video {{ width: 100%; max-width: 700px; display: block; margin: 20px auto; border-radius: 10px; box-shadow: 0 4px 6px rgba(0,0,0,0.1); }}
-                .lecture-text {{ background: white; padding: 20px; border-radius: 10px; margin: 20px 0; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }}
-                .question {{ background: white; padding: 20px; margin: 20px 0; border-radius: 10px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); border-left: 4px solid #3498db; }}
-                button {{ background: #3498db; color: white; padding: 12px 24px; border: none; border-radius: 6px; cursor: pointer; font-size: 14px; margin-top: 10px; }}
-                button:hover {{ background: #2980b9; }}
-                .feedback {{ margin-top: 15px; padding: 10px; border-radius: 5px; font-weight: bold; }}
-                label {{ margin-left: 8px; cursor: pointer; }}
-                input[type="radio"] {{ cursor: pointer; }}
-            </style>
-        </head>
-        <body>
-            <h1>📚 Interactive Lesson</h1>
-            <video controls>
-                <source src="data:video/mp4;base64,{video_base64}" type="video/mp4">
-            </video>
-            <div class="lecture-text">
-                <h3>📝 Lecture Text:</h3>
-                <p>{text.replace(chr(10), '<br>')}</p>
-            </div>
-            <h2 style="color: #2c3e50; text-align: center;">Test Your Knowledge:</h2>
-        """
         for i, q in enumerate(questions):
-            correct_escaped = q['correct'].replace("'", "\\'").replace('"', '\\"')
             html += f"""
-            <div class="question">
-                <p><strong>Question {i+1}:</strong> {q['question']}</p>
-                <div style="margin: 15px 0;">
-                    <input type="radio" name="q{i}" value="correct" id="correct{i}">
-                    <label for="correct{i}">{q['correct']}</label><br><br>
-                    <input type="radio" name="q{i}" value="wrong" id="wrong{i}">
-                    <label for="wrong{i}">{q['wrong']}</label>
-                </div>
-                <button onclick="checkAnswer({i}, '{correct_escaped}')">Check Answer</button>
-                <div class="feedback" id="feedback{i}"></div>
-            </div>
-            """
         html += """
-            <script>
-            function checkAnswer(i, correct) {
-                var selected = document.querySelector('input[name="q' + i + '"]:checked');
-                var feedback = document.getElementById('feedback' + i);
-                if (selected) {
-                    if (selected.value === 'correct') {
-                        feedback.innerHTML = '✅ Correct!';
-                        feedback.style.background = '#d4edda';
-                        feedback.style.color = '#155724';
-                    } else {
-                        feedback.innerHTML = '❌ Wrong. Correct answer: ' + correct;
-                        feedback.style.background = '#f8d7da';
-                        feedback.style.color = '#721c24';
-                    }
-                } else {
-                    feedback.innerHTML = '⚠️ Please select an answer!';
-                    feedback.style.background = '#fff3cd';
-                    feedback.style.color = '#856404';
-                }
-            }
-            </script>
-        </body>
-        </html>
-        """
-        # Экранирование
-        escaped_html = html.replace('\\', '\\\\').replace('`', '\\`').replace('${', '\\${')
         return f"""
-        <div style="text-align: center; padding: 30px; background: white; border-radius: 10px;">
-            <h3 style="color: #2c3e50; margin-bottom: 20px;">✅ Interactive lesson is ready!</h3>
-            <button onclick="openLesson()" style="background: #27ae60; color: white; padding: 15px 40px; font-size: 18px; border: none; border-radius: 8px; cursor: pointer; box-shadow: 0 4px 6px rgba(0,0,0,0.1);">
-                📖 Open Interactive Lesson
-            </button>
-        </div>
-        <script>
-        function openLesson() {{
-            var w = window.open('', '_blank');
-            w.document.write(`{escaped_html}`);
-            w.document.close();
-        }}
-        </script>
-        """
     except Exception as e:
         traceback.print_exc()
-        return f"<p style='color: red;'>❌ Error: {str(e)}</p>"
 # Интерфейс
-with gr.Blocks(theme=gr.themes.Soft(), title="Video Lecturer") as iface:
     gr.Markdown("""
-    # 🎓 AI Video Lecturer
-    Upload your photo and enter lecture text in Russian. AI will translate to Kazakh/English and create a video lecture!
-    **Requirements:**
-    - 📸 Photo: Clear frontal face photo
-    - 📝 Text: In Russian, max 500 characters
     """)
     with gr.Row():
-        with gr.Column():
-            image_input = gr.Image(type="pil", label="📸 Lecturer Photo")
             text_input = gr.Textbox(
                 lines=6,
-                placeholder="Example: Hello! Today we will talk about mathematics...",
-                label="📝 Lecture Text (Russian, max 500 chars)"
             )
-            generate_video_btn = gr.Button("🎬 Generate Video", variant="primary", size="lg")
-        with gr.Column():
-            video_output = gr.Video(label="🎬 Generated Video")
-            status = gr.Textbox(label="ℹ️ Status", interactive=False)
-    interactive_btn = gr.Button("📚 Create Interactive Lesson", visible=False, variant="secondary", size="lg")
     lesson_output = gr.HTML(visible=False)
-    def show_interactive_btn(video, status_msg):
         return gr.update(visible=bool(video and "✅" in status_msg))
-    generate_video_btn.click(
         inference,
         inputs=[image_input, text_input],
         outputs=[video_output, status]
     ).then(
-        show_interactive_btn,
         inputs=[video_output, status],
         outputs=interactive_btn
     )
@@ -411,4 +393,8 @@ with gr.Blocks(theme=gr.themes.Soft(), title="Video Lecturer") as iface:
     )
 if __name__ == "__main__":
-    iface.launch()

 import tempfile
 from gradio_client import Client, handle_file
 import torch
+from transformers import VitsModel, AutoTokenizer
 import scipy.io.wavfile as wavfile
 import traceback
 import base64
 import random
+# Принудительно CPU и минимальное использование памяти
+os.environ['CUDA_VISIBLE_DEVICES'] = ''
+torch.set_num_threads(2)  # Ограничение потоков CPU
+device = "cpu"
+print(f"Using device: {device} (optimized mode)")
+# Глобальные переменные
 tts_model = None
 tts_tokenizer = None
 TALKING_HEAD_SPACE = "Skywork/skyreels-a1-talking-head"
def load_tts_model():
    """Lazily load the TTS model and its tokenizer into the module globals.

    The first call downloads/loads ``facebook/mms-tts-kaz`` and stores the
    model in ``tts_model`` and the tokenizer in ``tts_tokenizer``; later calls
    are no-ops.

    Both objects are loaded into locals first and published together, so a
    failure while loading the tokenizer cannot leave ``tts_model`` set while
    ``tts_tokenizer`` is still ``None`` (which would make every later call
    skip loading and leave the tokenizer permanently missing).

    Returns:
        True once both the model and the tokenizer are available.

    Raises:
        Whatever ``from_pretrained`` raises; loading errors are not swallowed
        here and propagate to the caller.
    """
    global tts_model, tts_tokenizer

    if tts_model is None or tts_tokenizer is None:
        print("Загрузка TTS модели (казахский)...")
        model = VitsModel.from_pretrained(
            "facebook/mms-tts-kaz",
            torch_dtype=torch.float32,
            low_cpu_mem_usage=True,
        )
        model.eval()  # inference mode
        tokenizer = AutoTokenizer.from_pretrained("facebook/mms-tts-kaz")

        # Publish both globals only after both loads succeeded.
        tts_model, tts_tokenizer = model, tokenizer
        print("✓ TTS модель загружена")

    return True
def simple_translate_to_kazakh(russian_text: str) -> str:
    """Replace a small set of known Russian words with Kazakh equivalents.

    This is a demo-grade glossary substitution, not a real translation: words
    that are not in the glossary are returned unchanged. A lightweight model
    or an external API is needed for real use.

    Matching is done on whole words only, in a single pass, so short glossary
    entries are not replaced inside longer words (e.g. "да" inside "тогда")
    and already substituted Kazakh text is never substituted again.

    Letter case is carried over: an all-uppercase word yields an uppercase
    replacement, a word starting with an uppercase letter yields a capitalized
    replacement, anything else yields the lowercase replacement.

    Args:
        russian_text: Input text in Russian.

    Returns:
        The text with glossary words substituted.
    """
    import re

    # Basic vocabulary (demo).
    translations = {
        'привет': 'сәлем',
        'здравствуйте': 'сәлеметсіздер ме',
        'спасибо': 'рахмет',
        'пожалуйста': 'өтінемін',
        'да': 'иә',
        'нет': 'жоқ',
        'сегодня': 'бүгін',
        'завтра': 'ертең',
        'математика': 'математика',
        'физика': 'физика',
        'урок': 'сабақ',
        'лекция': 'дәріс',
        'студент': 'студент',
        'учитель': 'мұғалім',
        'школа': 'мектеп',
        'университет': 'университет',
        'знание': 'білім',
        'книга': 'кітап',
        'вопрос': 'сұрақ',
        'ответ': 'жауап',
    }

    # One alternation over all glossary words, guarded on both sides so that
    # only complete words match (\w is Unicode-aware for str patterns).
    alternatives = "|".join(
        re.escape(word) for word in sorted(translations, key=len, reverse=True)
    )
    pattern = re.compile(rf"(?<!\w)(?:{alternatives})(?!\w)", re.IGNORECASE)

    def _substitute(match):
        word = match.group(0)
        kazakh = translations.get(word.lower(), word)
        if len(word) > 1 and word.isupper():
            return kazakh.upper()
        if word[0].isupper():
            return kazakh.capitalize()
        return kazakh

    return pattern.sub(_substitute, russian_text)
 def inference(image: Image.Image, text: str):
     error_msg = ""
     img_path = None
     try:
+        # Загрузка TTS
+        if not load_tts_model():
+            raise RuntimeError("Не удалось загрузить TTS модель")
         # Валидация
         if image is None:
             raise ValueError("Загрузите изображение лектора!")
         if not text or not text.strip():
+            raise ValueError("Введите текст лекции!")
         if len(text) > 500:
+            raise ValueError("Текст слишком длинный! Максимум 500 символов.")
+        print(f"Входной текст: '{text[:50]}...'")
+        # Простой перевод на казахский
+        translated_text = simple_translate_to_kazakh(text)
         print(f"Переведенный текст: '{translated_text[:50]}...'")
+        # Генерация аудио с оптимизацией памяти
+        print("Генерация аудио...")
         with torch.no_grad():
+            inputs = tts_tokenizer(translated_text, return_tensors="pt", truncation=True, max_length=512)
+            # Освобождение памяти перед генерацией
+            if torch.cuda.is_available():
+                torch.cuda.empty_cache()
             output = tts_model(**inputs)
             waveform = output.waveform.squeeze().cpu().numpy()
+            # Очистка
+            del inputs, output
         if waveform.size == 0:
             raise ValueError("TTS сгенерировал пустое аудио!")
+        # Сохранение аудио
         audio = (waveform * 32767).astype("int16")
         sampling_rate = tts_model.config.sampling_rate
             wavfile.write(audio_file.name, sampling_rate, audio)
             audio_path = audio_file.name
+        print(f"✓ Аудио: {audio_path} ({len(waveform)/sampling_rate:.1f} сек)")
+        # Оптимизация изображения
+        print("Обработка изображения...")
+        if image.mode != 'RGB':
+            image = image.convert('RGB')
+        # Уменьшаем размер если слишком большое (экономия памяти)
+        max_size = 1024
+        if max(image.size) > max_size:
+            ratio = max_size / max(image.size)
+            new_size = tuple(int(dim * ratio) for dim in image.size)
+            image = image.resize(new_size, Image.Resampling.LANCZOS)
+            print(f"Изображение уменьшено до {new_size}")
         with tempfile.NamedTemporaryFile(suffix=".png", delete=False) as img_file:
+            image.save(img_file.name, format='PNG', optimize=True)
             img_path = img_file.name
+        print(f"✓ Изображение: {img_path}")
+        # Вызов Talking Head API
         print(f"Подключение к {TALKING_HEAD_SPACE}...")
+        client = Client(TALKING_HEAD_SPACE, verbose=False)
         result = client.predict(
             image_path=handle_file(img_path),
             audio_path=handle_file(audio_path),
+            guidance_scale=2.5,  # Снижено для скорости
+            steps=8,  # Меньше шагов = быстрее
             api_name="/process_image_audio"
         )
         if not video_path or not os.path.exists(video_path):
             raise ValueError("Видео не сгенерировано!")
+        print(f"✓ Видео: {video_path}")
         error_msg = "✅ Бейне сәтті жасалды!"
     except Exception as e:
+        error_msg = f"❌ Қате: {str(e)}"
         print(f"ОШИБКА: {error_msg}")
         traceback.print_exc()
     finally:
+        # Очистка временных файлов
         for path in [audio_path, img_path]:
             if path and os.path.exists(path):
                 try:
     return video_path, error_msg
 def generate_interactive_lesson(text, video_path):
+    """Упрощенная версия без тяжелых моделей QA"""
     try:
         if not video_path or not os.path.exists(video_path):
+            return "<p style='color: red;'>❌ Алдымен бейнені жасаңыз!</p>"
+        # Простая генерация вопросов без ML моделей
+        sentences = text.split('.')[:3]  # Первые 3 предложения
         questions = []
         for i, sent in enumerate(sentences):
+            sent = sent.strip()
             if len(sent) < 10:
                 continue
+            # Простые шаблоны вопросов
+            words = sent.split()
+            if len(words) < 3:
                 continue
+            # Генерируем вопрос на основе шаблона
+            question_templates = [
+                f"Не сказано о {words[0].lower()}?",
+                f"Что упоминается в тексте о {words[1].lower() if len(words) > 1 else 'теме'}?",
+                f"Какая информация дана о {words[2].lower() if len(words) > 2 else 'содержании'}?"
+            ]
+            question = random.choice(question_templates)
+            # Правильный ответ - часть предложения
+            correct = ' '.join(words[:min(5, len(words))])
+            # Неправильные ответы
+            wrong_options = [
+                "Бұл туралы айтылмаған",
+                "Мәтінде жоқ",
+                "Дұрыс емес жауап"
+            ]
+            wrong = random.choice(wrong_options)
+            questions.append({
+                "question": question,
+                "correct": correct,
+                "wrong": wrong
+            })
         if not questions:
+            # Создаем хотя бы один вопрос
+            questions.append({
+                "question": "Дәрістің негізгі тақырыбы не?",
+                "correct": text.split('.')[0][:50] if text else "Білім",
+                "wrong": "Спорт туралы"
+            })
+        # Base64 видео (оптимизировано)
+        print("Кодирование видео в base64...")
         with open(video_path, 'rb') as f:
+            video_data = f.read()
+            # Проверка размера
+            if len(video_data) > 50 * 1024 * 1024:  # 50MB
+                return "<p style='color: orange;'>⚠️ Видео слишком большое для встраивания. Скачайте его отдельно.</p>"
+            video_base64 = base64.b64encode(video_data).decode('utf-8')
+        # Минимальный HTML
         html = f"""<!DOCTYPE html>
+<html>
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Интерактивті сабақ</title>
+    <style>
+        * {{ margin: 0; padding: 0; box-sizing: border-box; }}
+        body {{ font-family: Arial, sans-serif; max-width: 800px; margin: 0 auto; padding: 15px; background: #f5f5f5; }}
+        h1 {{ color: #333; text-align: center; margin: 20px 0; font-size: 24px; }}
+        video {{ width: 100%; max-width: 600px; display: block; margin: 20px auto; border-radius: 8px; box-shadow: 0 2px 8px rgba(0,0,0,0.1); }}
+        .text {{ background: white; padding: 15px; margin: 20px 0; border-radius: 8px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }}
+        .q {{ background: white; padding: 15px; margin: 15px 0; border-radius: 8px; box-shadow: 0 2px 4px rgba(0,0,0,0.1); }}
+        button {{ background: #4CAF50; color: white; padding: 10px 20px; border: none; border-radius: 5px; cursor: pointer; margin-top: 10px; }}
+        button:hover {{ background: #45a049; }}
+        .fb {{ margin-top: 10px; padding: 8px; border-radius: 5px; font-weight: bold; }}
+        label {{ cursor: pointer; }}
+    </style>
+</head>
+<body>
+    <h1>📚 Интерактивті сабақ</h1>
+    <video controls><source src="data:video/mp4;base64,{video_base64}" type="video/mp4"></video>
+    <div class="text"><strong>Дәріс мәтіні:</strong> {text[:500]}</div>
+    <h2 style="text-align:center; margin: 20px 0;">Тесттер:</h2>
+"""
         for i, q in enumerate(questions):
+            ca = q['correct'].replace("'", "\\'").replace('"', '&quot;')
             html += f"""
+    <div class="q">
+        <p><strong>Сұрақ {i+1}:</strong> {q['question']}</p>
+        <div style="margin: 10px 0;">
+            <input type="radio" name="q{i}" value="c" id="c{i}">
+            <label for="c{i}">{q['correct']}</label><br>
+            <input type="radio" name="q{i}" value="w" id="w{i}">
+            <label for="w{i}">{q['wrong']}</label>
+        </div>
+        <button onclick="check({i},'{ca}')">Тексеру</button>
+        <div class="fb" id="fb{i}"></div>
+    </div>
+"""
         html += """
+    <script>
+    function check(i, c) {
+        var s = document.querySelector('input[name="q'+i+'"]:checked');
+        var f = document.getElementById('fb'+i);
+        if(!s) { f.innerHTML='⚠️ Жауап таңдаңыз!'; f.style.background='#fff3cd'; f.style.color='#856404'; return; }
+        if(s.value==='c') { f.innerHTML='✅ Дұрыс!'; f.style.background='#d4edda'; f.style.color='#155724'; }
+        else { f.innerHTML='❌ Қате. Дұрыс: '+c; f.style.background='#f8d7da'; f.style.color='#721c24'; }
+    }
+    </script>
+</body>
+</html>"""
+        escaped = html.replace('\\', '\\\\').replace('`', '\\`').replace('${', '\\${')
         return f"""
+<div style="text-align:center; padding: 20px; background: white; border-radius: 8px;">
+    <h3 style="color: #2c3e50;">✅ Интерактивті сабақ дайын!</h3>
+    <button onclick="var w=window.open('','_blank');w.document.write(`{escaped}`);w.document.close();"
+            style="background: #27ae60; color: white; padding: 15px 30px; font-size: 16px; border: none;
+            border-radius: 8px; cursor: pointer; margin-top: 15px; box-shadow: 0 4px 6px rgba(0,0,0,0.1);">
+        📖 Интерактивті сабақты ашу
+    </button>
+</div>
+"""
     except Exception as e:
         traceback.print_exc()
+        return f"<p style='color: red;'>❌ Қате: {str(e)}</p>"
 # Интерфейс
+with gr.Blocks(theme=gr.themes.Soft(), title="Бейне Оқытушы", css="""
+    .gradio-container {max-width: 1200px !important;}
+    footer {display: none !important;}
+""") as iface:
     gr.Markdown("""
+    # 🎓 Бейне Оқытушы (CPU Оптимизацияланған)
+    **Қалай пайдалану:**
+    1. 📸 Суретіңізді жүктеңіз (бет анық көрінетін)
+    2. 📝 Дәріс мәтінін орыс тілінде енгізіңіз (500 таңбаға дейін)
+    3. 🎬 "Бейнені жасау" батырмасын басыңыз
+    4. 📚 Дайын болғаннан кейін "Интерактивті сабақ" жасай аласыз
+    ⚡ **Ескерту:** CPU режимінде жұмыс істейді, генерация 1-3 минут алуы мүмкін.
     """)
     with gr.Row():
+        with gr.Column(scale=1):
+            image_input = gr.Image(type="pil", label="📸 Дәріскер суреті")
             text_input = gr.Textbox(
                 lines=6,
+                placeholder="Мысалы: Сәлеметсіздер ме! Бүгін біз математика туралы сөйлесеміз...",
+                label="📝 Дәріс мәтіні (орыс тілінде)"
             )
+            generate_btn = gr.Button("🎬 Бейнені жасау", variant="primary", size="lg")
+        with gr.Column(scale=1):
+            video_output = gr.Video(label="🎬 Дайын бейне")
+            status = gr.Textbox(label="ℹ️ Мәртебе", interactive=False)
+    interactive_btn = gr.Button("📚 Интерактивті сабақ жасау", visible=False, variant="secondary")
     lesson_output = gr.HTML(visible=False)
+    def show_lesson_btn(video, status_msg):
         return gr.update(visible=bool(video and "✅" in status_msg))
+    generate_btn.click(
         inference,
         inputs=[image_input, text_input],
         outputs=[video_output, status]
     ).then(
+        show_lesson_btn,
         inputs=[video_output, status],
         outputs=interactive_btn
     )
     )
 if __name__ == "__main__":
+    iface.launch(
+        server_name="0.0.0.0",
+        server_port=7860,
+        share=False
+    )