Fix streaming and use proper system prompts
Issues fixed:
1. Streaming did not work properly - code only appeared once generation finished
2. Language-specific prompts from prompts.py were not being used
Backend changes (backend_api.py):
- Import system prompts from anycoder_app/prompts.py
- Initialize Gradio and ComfyUI prompts on startup via docs_manager
- Use language-specific prompts (HTML, Gradio, Streamlit, React, etc.)
- Add proper system prompt selection based on language parameter
- Add a short sleep (0.01s) after each chunk so events flush to the client immediately (see the streaming sketch after this list)
- Add chunk counting and logging for debugging
- Add detailed logging for prompt selection
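For reference, the streaming pattern behind these backend changes is roughly the following. This is a condensed sketch, not the exact code in backend_api.py - the generator name and surrounding setup are assumed, while the event shapes ("chunk", "complete") match what the frontend parses:

import asyncio
import json
from datetime import datetime

async def stream_sse_events(stream):
    # Turn model chunks into Server-Sent Events as they arrive
    generated_code = ""
    chunk_count = 0
    for chunk in stream:
        if not (chunk.choices and chunk.choices[0].delta.content):
            continue
        content = chunk.choices[0].delta.content
        generated_code += content
        chunk_count += 1
        yield "data: " + json.dumps({
            "type": "chunk",
            "content": content,
            "timestamp": datetime.now().isoformat(),
        }) + "\n\n"
        # Yield control to the event loop so each event is flushed immediately
        await asyncio.sleep(0.01)
    print(f"[Generate] Completed with {chunk_count} chunks, total length: {len(generated_code)}")
    # Final event carries the complete generated code
    yield "data: " + json.dumps({"type": "complete", "code": generated_code}) + "\n\n"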
Frontend changes (page.tsx, api.ts):
- Add console logging to track chunk reception
- Log SSE events for debugging
- Log buffer sizes and chunk lengths
- Track generation completion with total code length
This ensures:
✅ Proper language-specific prompts are used (HTML, Gradio, Streamlit, etc.)
✅ Streaming works immediately, with chunks appearing in real time (verifiable with the client sketch after this list)
✅ Better debugging with console logs
✅ Backend properly flushes chunks to frontend
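A quick way to confirm the streaming behavior outside the browser is to watch the raw SSE stream directly. A minimal sketch using httpx - the endpoint URL and query parameters here are assumptions, substitute the actual route exposed by backend_api.py:

import httpx

# Hypothetical route and params, for illustration only
with httpx.stream("GET", "http://localhost:8000/api/generate",
                  params={"query": "a todo app", "language": "html"},
                  timeout=None) as response:
    for line in response.iter_lines():
        if line.startswith("data: "):
            # Each event should arrive as it is generated, not all at once
            print(line[:80])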
Files changed:
- backend_api.py +43 -3
- frontend/src/app/page.tsx +2 -0
- frontend/src/lib/api.ts +3 -0
backend_api.py

@@ -19,6 +19,30 @@ import os
 from huggingface_hub import InferenceClient
 import httpx
 
+# Import system prompts for code generation
+from anycoder_app.prompts import (
+    HTML_SYSTEM_PROMPT,
+    TRANSFORMERS_JS_SYSTEM_PROMPT,
+    STREAMLIT_SYSTEM_PROMPT,
+    REACT_SYSTEM_PROMPT,
+    GRADIO_SYSTEM_PROMPT,
+    JSON_SYSTEM_PROMPT,
+    GENERIC_SYSTEM_PROMPT
+)
+
+# Initialize Gradio and ComfyUI prompts on startup
+try:
+    from anycoder_app.docs_manager import update_gradio_system_prompts, update_json_system_prompts
+    print("[Startup] Initializing Gradio and ComfyUI system prompts...")
+    update_gradio_system_prompts()
+    update_json_system_prompts()
+    # Re-import to get updated prompts
+    from anycoder_app.prompts import GRADIO_SYSTEM_PROMPT, JSON_SYSTEM_PROMPT
+    print("[Startup] System prompts initialized successfully")
+except Exception as e:
+    print(f"[Startup] Warning: Could not initialize dynamic prompts: {e}")
+    print("[Startup] Will use fallback prompts")
+
 # Define models and languages here to avoid importing Gradio UI
 AVAILABLE_MODELS = [
     {"name": "Sherlock Dash Alpha", "id": "openrouter/sherlock-dash-alpha", "description": "Sherlock Dash Alpha model via OpenRouter"},
@@ -310,8 +334,18 @@ async def generate_code(
     # Track generated code
     generated_code = ""
 
-    #
-
+    # Select appropriate system prompt based on language
+    prompt_map = {
+        "html": HTML_SYSTEM_PROMPT,
+        "gradio": GRADIO_SYSTEM_PROMPT,
+        "streamlit": STREAMLIT_SYSTEM_PROMPT,
+        "transformers.js": TRANSFORMERS_JS_SYSTEM_PROMPT,
+        "react": REACT_SYSTEM_PROMPT,
+        "comfyui": JSON_SYSTEM_PROMPT,
+    }
+    system_prompt = prompt_map.get(language, GENERIC_SYSTEM_PROMPT.format(language=language))
+
+    print(f"[Generate] Using {language} prompt for query: {query[:100]}...")
 
     # Get the real model ID
     actual_model_id = selected_model["id"]
@@ -372,6 +406,7 @@ async def generate_code(
                 stream=True
             )
 
+            chunk_count = 0
             for chunk in stream:
                 # Check if choices array has elements before accessing
                 if (hasattr(chunk, 'choices') and
@@ -382,6 +417,7 @@ async def generate_code(
                     chunk.choices[0].delta.content):
                     content = chunk.choices[0].delta.content
                     generated_code += content
+                    chunk_count += 1
 
                     # Send chunk as Server-Sent Event
                     event_data = json.dumps({
@@ -390,7 +426,11 @@ async def generate_code(
                         "timestamp": datetime.now().isoformat()
                     })
                     yield f"data: {event_data}\n\n"
-
+
+                    # Ensure immediate flush to client
+                    await asyncio.sleep(0.01)  # Small delay to ensure flushing
+
+            print(f"[Generate] Completed with {chunk_count} chunks, total length: {len(generated_code)}")
 
             # Send completion event
             completion_data = json.dumps({

frontend/src/app/page.tsx

@@ -79,6 +79,8 @@ export default function Home() {
         // onChunk - Update code editor in real-time, NOT the chat
         (chunk: string) => {
           generatedCodeBuffer += chunk;
+          console.log('[Stream] Received chunk:', chunk.substring(0, 50), '... (length:', chunk.length, ')');
+          console.log('[Stream] Buffer size:', generatedCodeBuffer.length);
           setGeneratedCode(generatedCodeBuffer);
         },
         // onComplete

frontend/src/lib/api.ts

@@ -119,13 +119,16 @@ class ApiClient {
     eventSource.onmessage = (event) => {
       try {
         const data = JSON.parse(event.data);
+        console.log('[SSE] Received event:', data.type, data.content?.substring(0, 30));
 
         if (data.type === 'chunk' && data.content) {
           onChunk(data.content);
         } else if (data.type === 'complete' && data.code) {
+          console.log('[SSE] Generation complete, total code length:', data.code.length);
           onComplete(data.code);
           eventSource.close();
         } else if (data.type === 'error') {
+          console.error('[SSE] Error:', data.message);
           onError(data.message || 'Unknown error occurred');
           eventSource.close();
         }