Spaces:

MCP-1st-Birthday
/

A.R.I.A-Autonomous_Rendering_and_Imaging_Agent

Running

App Files Files Community

byte-vortex committed on Nov 21, 2025

Commit

bd160cc

verified ·

1 Parent(s): a74fdb7

Update app.py

Browse files

Files changed (1) hide show

app.py +59 -35

app.py CHANGED Viewed

@@ -17,13 +17,35 @@ DEFAULT_SIZE = 512
 MAX_SEED = np.iinfo(np.int32).max
 # -----------------------------
-# 1. System & Model Setup
 # -----------------------------
 class MockPipe:
     """A dummy pipeline for testing without a GPU."""
     def __call__(self, *args, **kwargs):
-        time.sleep(1.5) # Simulate "thinking" time
         color = kwargs.get('color_hint', 'red')
         return type('obj', (object,), {'images': [Image.new('RGB', (512, 512), color=color)]})
@@ -42,28 +64,12 @@ try:
             requires_safety_checker=False
         ).to(device)
     else:
-        # Fallback for CPU
         pipe = MockPipe()
         print("⚠️ GPU not found. Using MockPipe for UI demonstration.")
 except Exception as e:
     print(f"⚠️ Model failed to load. Using MockPipe. Error: {e}")
     pipe = MockPipe()
-# -----------------------------
-# 2. Configuration & Logic
-# -----------------------------
-PANEL_V1_PRESETS = {
-    "Oil Painting 🎨": {"prompt": "Oil painting, heavy impasto, visible brushstrokes, masterpiece", "neg": "photorealistic, smooth, digital", "str": 0.80},
-    "Ink Illustration ✒️": {"prompt": "Ink and watercolor sketch, loose lines, artistic, intricate details", "neg": "3d render, solid colors", "str": 0.70},
-    "Noir Photography 📸": {"prompt": "High contrast black and white photography, film grain, dramatic shadows", "neg": "color, soft, painting", "str": 0.65},
-}
-PANEL_V2_PRESETS = {
-    "Cyberpunk City 🌆": {"prompt": "Cyberpunk atmosphere, neon lights, rain, volumetric fog, futuristic", "neg": "daylight, rustic, vintage", "str": 0.55},
-    "Scenic Anime 🗾": {"prompt": "High quality anime background art, hand-painted style, cumulus clouds, rolling hills, vibrant nature", "neg": "dark, gritty, horror, realism, sketch", "str": 0.60},
-    "Retro Vaporwave 📼": {"prompt": "Vaporwave aesthetic, pink and purple gradient lighting, VHS glitch effect", "neg": "high definition, neutral colors", "str": 0.50},
-}
 class AriaAgent:
     def __init__(self, pipe, device):
         self.pipe = pipe
@@ -71,38 +77,40 @@ class AriaAgent:
     def generate_reasoning(self, phase, tool_name, strength, user_intent):
         """Generates 'Chain of Thought' internal monologue text."""
         if phase == "analysis":
             return (
                 f"💭 THOUGHT: Analyzing input signal data...\n"
-                f"   > Observation: User provided semantic intent: '{user_intent}'\n"
                 f"   > Assessment: Input image requires stylistic abstraction.\n"
-                f"   > Strategy: I will split the task into Structure (Step 1) and Atmosphere (Step 2)."
             )
         elif phase == "step1":
             return (
                 f"💭 THOUGHT: Executing Foundation Layer.\n"
                 f"   > Selection: Tool '{tool_name}' chosen to break photorealism.\n"
                 f"   > Parameter Reasoning: Setting denoising strength to {strength:.2f}.\n"
-                f"     - Rationale: A high value is needed to overwrite original textures while keeping composition.\n"
                 f"   > Action: Injecting latent noise vectors..."
             )
         elif phase == "step2":
             return (
                 f"💭 THOUGHT: Refining Atmospheric Context.\n"
                 f"   > Selection: Tool '{tool_name}' chosen for lighting and mood.\n"
-                f"   > Parameter Reasoning: Reducing strength to {strength:.2f} to preserve the Step 1 strokes.\n"
-                f"   > Optimization: Aligning vector guidance with '{user_intent}'.\n"
                 f"   > Action: Final render pass initiating."
             )
         return ""
     def generate(self, image, prompt, neg, strength, steps, guide, seed):
-        # Mock generation logic for 'MockPipe'
         if isinstance(self.pipe, MockPipe):
             color = '#8b5cf6' if "Style" in prompt else '#10b981'
             return self.pipe(color_hint=color).images[0]
-        # Real generation logic
         with torch.inference_mode():
             image = image.resize((DEFAULT_SIZE, DEFAULT_SIZE))
             gen = torch.Generator(device=self.device).manual_seed(seed)
@@ -126,19 +134,22 @@ def run_ui_stream(
     if init_img is None:
         raise gr.Error("Please upload an input image first.")
     # 1. Initialization
     if rnd: seed = random.randint(0, MAX_SEED)
     gallery_state.append((init_img, "1. Input Signal"))
     # --- COT: Analysis Phase ---
-    analysis_thought = agent.generate_reasoning("analysis", "", 0, user_p if user_p else "General Transformation")
     logs.append(analysis_thought)
     yield "\n\n".join(logs), gallery_state, seed, "🤔 ANALYZING"
-    time.sleep(0.8) # Pause to let user read the "thought"
     # --- COT: Step 1 Planning ---
     p1 = PANEL_V1_PRESETS[v1_key]
     final_str_1 = min(1.0, p1['str'] * strength_mult)
     step1_thought = agent.generate_reasoning("step1", v1_key, final_str_1, user_p)
@@ -153,7 +164,9 @@ def run_ui_stream(
     yield "\n\n".join(logs), gallery_state, seed, "👀 OBSERVING"
     # --- COT: Step 2 Planning ---
     p2 = PANEL_V2_PRESETS[v2_key]
     step2_thought = agent.generate_reasoning("step2", v2_key, p2['str'], user_p)
     logs.append(step2_thought)
     yield "\n\n".join(logs), gallery_state, seed, "🌫️ ATMOSPHERE"
@@ -183,10 +196,10 @@ h1 {
     text-shadow: 0 0 10px rgba(56, 189, 248, 0.5);
 }
-/* FIXED: Subtitle is now bright Amber for high contrast */
 .subtitle {
     font-family: 'Space Mono', monospace;
-    color: #fbbf24; /* Amber-400 */
     font-weight: bold;
     font-size: 1.0rem;
     letter-spacing: 1px;
@@ -209,10 +222,9 @@ h1 {
 }
 #run-btn:hover { transform: scale(1.02); box-shadow: 0 0 25px rgba(139, 92, 246, 0.7); }
-/* Styled to look like a terminal code block */
 #log-output-box textarea {
     background-color: #0d1117 !important;
-    color: #4ade80 !important; /* Matrix Green text */
     font-family: 'Space Mono', monospace !important;
     font-size: 0.85rem !important;
     border: 1px solid #30363d !important;
@@ -245,7 +257,6 @@ with gr.Blocks(theme=theme, css=hackathon_css, title="A.R.I.A. Agent") as demo:
     with gr.Row(elem_classes="header-row"):
         with gr.Column(scale=6):
             gr.Markdown(f"# 🧬 {APP_TITLE}")
-            # Subtitle class applied here
             gr.HTML(f"<span class='subtitle'>{APP_SUBTITLE}</span>")
         with gr.Column(scale=2):
             status_display = gr.Textbox(value="🟢 SYSTEM READY", label="Agent Status", interactive=False, elem_id="status-bar")
@@ -263,9 +274,22 @@ with gr.Blocks(theme=theme, css=hackathon_css, title="A.R.I.A. Agent") as demo:
                 gr.Markdown("### 🕹️ 2. Parameters")
                 user_prompt = gr.Textbox(label="Creative Guidance", placeholder="E.g. 'A futuristic city at night'...", lines=2)
                 with gr.Row():
-                    v1_select = gr.Dropdown(label="Tool A: Foundation", choices=list(PANEL_V1_PRESETS.keys()), value="Oil Painting 🎨")
-                    v2_select = gr.Dropdown(label="Tool B: Atmosphere", choices=list(PANEL_V2_PRESETS.keys()), value="Scenic Anime 🗾")
                 strength_mult_slide = gr.Slider(label="Concept Divergence", minimum=0.2, maximum=1.0, value=0.9, step=0.05)

 MAX_SEED = np.iinfo(np.int32).max
 # -----------------------------
+# 1. Configuration & Presets
+# -----------------------------
+# Presets are defined as dicts; V1_KEYS / V2_KEYS are derived from them so the UI choices and the lookup logic stay consistent
+PANEL_V1_PRESETS = {
+    "Oil Painting 🎨": {"prompt": "Oil painting, heavy impasto, visible brushstrokes, masterpiece", "neg": "photorealistic, smooth, digital", "str": 0.80},
+    "Ink Illustration ✒️": {"prompt": "Ink and watercolor sketch, loose lines, artistic, intricate details", "neg": "3d render, solid colors", "str": 0.70},
+    "Noir Photography 📸": {"prompt": "High contrast black and white photography, film grain, dramatic shadows", "neg": "color, soft, painting", "str": 0.65},
+    "Watercolor 💧": {"prompt": "Soft watercolor painting, bleeding edges, wet on wet, paper texture", "neg": "harsh lines, digital, opaque", "str": 0.75},
+}
+PANEL_V2_PRESETS = {
+    "Scenic Anime 🗾": {"prompt": "High quality anime background art, hand-painted style, cumulus clouds, rolling hills, vibrant nature", "neg": "dark, gritty, horror, realism, sketch", "str": 0.60},
+    "Cyberpunk City 🌆": {"prompt": "Cyberpunk atmosphere, neon lights, rain, volumetric fog, futuristic", "neg": "daylight, rustic, vintage", "str": 0.55},
+    "Retro Vaporwave 📼": {"prompt": "Vaporwave aesthetic, pink and purple gradient lighting, VHS glitch effect", "neg": "high definition, neutral colors", "str": 0.50},
+    "Ethereal Fantasy ✨": {"prompt": "Dreamy fantasy atmosphere, soft glowing light, magical particles, celestial", "neg": "dark, scary, industrial", "str": 0.60},
+}
+V1_KEYS = list(PANEL_V1_PRESETS.keys())
+V2_KEYS = list(PANEL_V2_PRESETS.keys())
+# -----------------------------
+# 2. System & Model Setup
 # -----------------------------
 class MockPipe:
     """A dummy pipeline for testing without a GPU."""
     def __call__(self, *args, **kwargs):
+        time.sleep(1.0) # Simulate "thinking" time
         color = kwargs.get('color_hint', 'red')
         return type('obj', (object,), {'images': [Image.new('RGB', (512, 512), color=color)]})
             requires_safety_checker=False
         ).to(device)
     else:
         pipe = MockPipe()
         print("⚠️ GPU not found. Using MockPipe for UI demonstration.")
 except Exception as e:
     print(f"⚠️ Model failed to load. Using MockPipe. Error: {e}")
     pipe = MockPipe()
 class AriaAgent:
     def __init__(self, pipe, device):
         self.pipe = pipe
     def generate_reasoning(self, phase, tool_name, strength, user_intent):
         """Generates 'Chain of Thought' internal monologue text."""
+        # Fall back to a default intent when the user prompt is empty or whitespace-only
+        context_intent = user_intent if user_intent.strip() else "Artistic Enhancement"
         if phase == "analysis":
             return (
                 f"💭 THOUGHT: Analyzing input signal data...\n"
+                f"   > Observation: User semantic intent: '{context_intent}'\n"
                 f"   > Assessment: Input image requires stylistic abstraction.\n"
+                f"   > Strategy: Split task -> Structure (Step 1) + Atmosphere (Step 2)."
             )
         elif phase == "step1":
             return (
                 f"💭 THOUGHT: Executing Foundation Layer.\n"
                 f"   > Selection: Tool '{tool_name}' chosen to break photorealism.\n"
                 f"   > Parameter Reasoning: Setting denoising strength to {strength:.2f}.\n"
+                f"     - Rationale: Overwriting original textures while keeping composition.\n"
                 f"   > Action: Injecting latent noise vectors..."
             )
         elif phase == "step2":
             return (
                 f"💭 THOUGHT: Refining Atmospheric Context.\n"
                 f"   > Selection: Tool '{tool_name}' chosen for lighting and mood.\n"
+                f"   > Parameter Reasoning: Reducing strength to {strength:.2f} to preserve Step 1 strokes.\n"
+                f"   > Optimization: Aligning vector guidance with '{context_intent}'.\n"
                 f"   > Action: Final render pass initiating."
             )
         return ""
     def generate(self, image, prompt, neg, strength, steps, guide, seed):
         if isinstance(self.pipe, MockPipe):
             color = '#8b5cf6' if "Style" in prompt else '#10b981'
             return self.pipe(color_hint=color).images[0]
         with torch.inference_mode():
             image = image.resize((DEFAULT_SIZE, DEFAULT_SIZE))
             gen = torch.Generator(device=self.device).manual_seed(seed)
     if init_img is None:
         raise gr.Error("Please upload an input image first.")
     # 1. Initialization
     if rnd: seed = random.randint(0, MAX_SEED)
     gallery_state.append((init_img, "1. Input Signal"))
     # --- COT: Analysis Phase ---
+    analysis_thought = agent.generate_reasoning("analysis", "", 0, user_p)
     logs.append(analysis_thought)
     yield "\n\n".join(logs), gallery_state, seed, "🤔 ANALYZING"
+    time.sleep(0.5)
     # --- COT: Step 1 Planning ---
+    # Fall back to the first preset if the selected key is not a known preset
+    if v1_key not in PANEL_V1_PRESETS: v1_key = V1_KEYS[0]
     p1 = PANEL_V1_PRESETS[v1_key]
     final_str_1 = min(1.0, p1['str'] * strength_mult)
     step1_thought = agent.generate_reasoning("step1", v1_key, final_str_1, user_p)
     yield "\n\n".join(logs), gallery_state, seed, "👀 OBSERVING"
     # --- COT: Step 2 Planning ---
+    if v2_key not in PANEL_V2_PRESETS: v2_key = V2_KEYS[0]
     p2 = PANEL_V2_PRESETS[v2_key]
     step2_thought = agent.generate_reasoning("step2", v2_key, p2['str'], user_p)
     logs.append(step2_thought)
     yield "\n\n".join(logs), gallery_state, seed, "🌫️ ATMOSPHERE"
     text-shadow: 0 0 10px rgba(56, 189, 248, 0.5);
 }
+/* Bright Amber Subtitle for Visibility */
 .subtitle {
     font-family: 'Space Mono', monospace;
+    color: #fbbf24; /* Amber */
     font-weight: bold;
     font-size: 1.0rem;
     letter-spacing: 1px;
 }
 #run-btn:hover { transform: scale(1.02); box-shadow: 0 0 25px rgba(139, 92, 246, 0.7); }
 #log-output-box textarea {
     background-color: #0d1117 !important;
+    color: #4ade80 !important; /* Matrix Green */
     font-family: 'Space Mono', monospace !important;
     font-size: 0.85rem !important;
     border: 1px solid #30363d !important;
     with gr.Row(elem_classes="header-row"):
         with gr.Column(scale=6):
             gr.Markdown(f"# 🧬 {APP_TITLE}")
             gr.HTML(f"<span class='subtitle'>{APP_SUBTITLE}</span>")
         with gr.Column(scale=2):
             status_display = gr.Textbox(value="🟢 SYSTEM READY", label="Agent Status", interactive=False, elem_id="status-bar")
                 gr.Markdown("### 🕹️ 2. Parameters")
                 user_prompt = gr.Textbox(label="Creative Guidance", placeholder="E.g. 'A futuristic city at night'...", lines=2)
+                # Preset dropdowns; interactive=True is set explicitly so the selection stays user-editable.
                 with gr.Row():
+                    v1_select = gr.Dropdown(
+                        label="Tool A: Foundation",
+                        choices=V1_KEYS,
+                        value=V1_KEYS[0],
+                        interactive=True,
+                        min_width=150
+                    )
+                    v2_select = gr.Dropdown(
+                        label="Tool B: Atmosphere",
+                        choices=V2_KEYS,
+                        value=V2_KEYS[0],
+                        interactive=True,
+                        min_width=150
+                    )
                 strength_mult_slide = gr.Slider(label="Concept Divergence", minimum=0.2, maximum=1.0, value=0.9, step=0.05)