Spaces:

k-mktr
/

gpu-poor-llm-arena

Running

App Files Files Community

k-mktr committed on Oct 22, 2024

Commit

4af6b14

verified ·

1 Parent(s): 7510128

Update app.py

Browse files

Files changed (1) hide show

app.py +75 -12

app.py CHANGED Viewed

@@ -6,12 +6,16 @@ import logging
 import arena_config
 import plotly.graph_objects as go
 from typing import Dict
-from leaderboard import get_current_leaderboard, update_leaderboard
 # Initialize logging for errors only
 logging.basicConfig(level=logging.ERROR)
 logger = logging.getLogger(__name__)
 # Function to get available models (using predefined list)
 def get_available_models():
     """Return the first element of every entry in arena_config.APPROVED_MODELS.

     Presumably that first element is the model name; confirm against
     arena_config, which is not visible here.
     """
     return [model[0] for model in arena_config.APPROVED_MODELS]
@@ -57,9 +61,15 @@ def battle_arena(prompt):
     nickname_a = random.choice(arena_config.model_nicknames)
     nickname_b = random.choice(arena_config.model_nicknames)
-    # Format responses for gr.Chatbot
-    response_a_formatted = [{"role": "assistant", "content": response_a}]
-    response_b_formatted = [{"role": "assistant", "content": response_b}]
     if random.choice([True, False]):
         return (
@@ -67,7 +77,10 @@ def battle_arena(prompt):
             gr.update(label=nickname_a, value=response_a_formatted),
             gr.update(label=nickname_b, value=response_b_formatted),
             gr.update(interactive=True, value=f"Vote for {nickname_a}"),
-            gr.update(interactive=True, value=f"Vote for {nickname_b}")
         )
     else:
         return (
@@ -75,7 +88,10 @@ def battle_arena(prompt):
             gr.update(label=nickname_a, value=response_b_formatted),
             gr.update(label=nickname_b, value=response_a_formatted),
             gr.update(interactive=True, value=f"Vote for {nickname_a}"),
-            gr.update(interactive=True, value=f"Vote for {nickname_b}")
         )
 def record_vote(prompt, left_response, right_response, left_model, right_model, choice):
@@ -108,6 +124,7 @@ def record_vote(prompt, left_response, right_response, left_model, right_model,
         get_leaderboard(),                              # Update leaderboard
         gr.update(interactive=False),                   # Disable left vote button
         gr.update(interactive=False),                   # Disable right vote button
         gr.update(visible=True),                        # Show model names
         get_leaderboard_chart()                         # Update leaderboard chart
     )
@@ -182,6 +199,12 @@ def get_leaderboard():
             rank_display = "🥈"
         elif index == 3:
             rank_display = "🥉"
         else:
             rank_display = f"{index}"
@@ -295,10 +318,12 @@ def new_battle():
         None,
         gr.update(interactive=False, value=f"Vote for {nickname_a}"),
         gr.update(interactive=False, value=f"Vote for {nickname_b}"),
         gr.update(value="", visible=False),
         gr.update(),
         gr.update(visible=False),
-        gr.update()
     )
 # Add this new function
@@ -310,6 +335,33 @@ def get_human_readable_name(model_name: str) -> str:
 def random_prompt():
     """Return one entry picked at random from arena_config.example_prompts."""
     return random.choice(arena_config.example_prompts)
 # Initialize Gradio Blocks
 with gr.Blocks(css="""
     #dice-button {
@@ -346,6 +398,7 @@ with gr.Blocks(css="""
         with gr.Row():
             left_vote_btn = gr.Button(f"Vote for {left_output.label}", interactive=False)
             right_vote_btn = gr.Button(f"Vote for {right_output.label}", interactive=False)
         result = gr.Textbox(label="Result", interactive=False, visible=False)
@@ -354,6 +407,9 @@ with gr.Blocks(css="""
             left_model = gr.Textbox(label="🔵 Left Model", interactive=False)
             right_model = gr.Textbox(label="🔴 Right Model", interactive=False)
         new_battle_btn = gr.Button("New Battle")
     # Leaderboard Tab
@@ -369,28 +425,35 @@ with gr.Blocks(css="""
         battle_arena,
         inputs=prompt_input,
         outputs=[left_output, right_output, left_model, right_model,
-                 left_output, right_output, left_vote_btn, right_vote_btn]
     )
     left_vote_btn.click(
         lambda *args: record_vote(*args, "Left is better"),
         inputs=[prompt_input, left_output, right_output, left_model, right_model],
         outputs=[result, leaderboard, left_vote_btn,
-                 right_vote_btn, model_names_row, leaderboard_chart]
     )
     right_vote_btn.click(
         lambda *args: record_vote(*args, "Right is better"),
         inputs=[prompt_input, left_output, right_output, left_model, right_model],
         outputs=[result, leaderboard, left_vote_btn,
-                 right_vote_btn, model_names_row, leaderboard_chart]
     )
     new_battle_btn.click(
         new_battle,
         outputs=[prompt_input, left_output, right_output, left_model,
-                 right_model, left_vote_btn, right_vote_btn,
-                 result, leaderboard, model_names_row, leaderboard_chart]
     )
     # Update leaderboard and chart on launch

 import arena_config
 import plotly.graph_objects as go
 from typing import Dict
+from leaderboard import get_current_leaderboard, update_leaderboard, start_backup_thread
 # Initialize logging for errors only
 logging.basicConfig(level=logging.ERROR)
 logger = logging.getLogger(__name__)
+# Start the backup thread
+start_backup_thread()
 # Function to get available models (using predefined list)
 def get_available_models():
     """Return the first element of every entry in arena_config.APPROVED_MODELS.

     Presumably that first element is the model name; confirm against
     arena_config, which is not visible here.
     """
     return [model[0] for model in arena_config.APPROVED_MODELS]
     nickname_a = random.choice(arena_config.model_nicknames)
     nickname_b = random.choice(arena_config.model_nicknames)
+    # Format responses for gr.Chatbot, including the user's prompt
+    response_a_formatted = [
+        {"role": "user", "content": prompt},
+        {"role": "assistant", "content": response_a}
+    ]
+    response_b_formatted = [
+        {"role": "user", "content": prompt},
+        {"role": "assistant", "content": response_b}
+    ]
     if random.choice([True, False]):
         return (
             gr.update(label=nickname_a, value=response_a_formatted),
             gr.update(label=nickname_b, value=response_b_formatted),
             gr.update(interactive=True, value=f"Vote for {nickname_a}"),
+            gr.update(interactive=True, value=f"Vote for {nickname_b}"),
+            gr.update(interactive=True, visible=True),  # Enable and show Tie button
+            prompt,  # Return the original prompt
+            0  # Initialize tie count
         )
     else:
         return (
             gr.update(label=nickname_a, value=response_b_formatted),
             gr.update(label=nickname_b, value=response_a_formatted),
             gr.update(interactive=True, value=f"Vote for {nickname_a}"),
+            gr.update(interactive=True, value=f"Vote for {nickname_b}"),
+            gr.update(interactive=True, visible=True),  # Enable and show Tie button
+            prompt,  # Return the original prompt
+            0  # Initialize tie count
         )
 def record_vote(prompt, left_response, right_response, left_model, right_model, choice):
         get_leaderboard(),                              # Update leaderboard
         gr.update(interactive=False),                   # Disable left vote button
         gr.update(interactive=False),                   # Disable right vote button
+        gr.update(interactive=False),                   # Disable tie button
         gr.update(visible=True),                        # Show model names
         get_leaderboard_chart()                         # Update leaderboard chart
     )
             rank_display = "🥈"
         elif index == 3:
             rank_display = "🥉"
+        elif index == 18:
+            rank_display = "😞"
+        elif index == 19:
+            rank_display = "😰"
+        elif index == 20:
+            rank_display = "😭"
         else:
             rank_display = f"{index}"
         None,
         gr.update(interactive=False, value=f"Vote for {nickname_a}"),
         gr.update(interactive=False, value=f"Vote for {nickname_b}"),
+        gr.update(interactive=False, visible=False),  # Reset Tie button
         gr.update(value="", visible=False),
         gr.update(),
         gr.update(visible=False),
+        gr.update(),
+        0  # Reset tie_count
     )
 # Add this new function
 def random_prompt():
     """Return one entry picked at random from arena_config.example_prompts."""
     return random.choice(arena_config.example_prompts)
+# Tie handler: continue the current battle by sending a new prompt to both models
+def continue_conversation(prompt, left_chat, right_chat, left_model, right_model, previous_prompt, tie_count):  # Wired to tie_btn.click; sends one more prompt to both models
+    # Fall back to a random example prompt when the input is empty or repeats the previous prompt
+    if not prompt or prompt == previous_prompt:
+        prompt = random.choice(arena_config.example_prompts)
+    left_response = call_ollama_api(left_model, prompt)  # Only the new prompt is passed; call_ollama_api is defined outside this view
+    right_response = call_ollama_api(right_model, prompt)
+    left_chat.append({"role": "user", "content": prompt})  # NOTE: appends to the list passed in (in-place mutation)
+    left_chat.append({"role": "assistant", "content": left_response})
+    right_chat.append({"role": "user", "content": prompt})  # Same user turn is recorded in both chats
+    right_chat.append({"role": "assistant", "content": right_response})
+    tie_count += 1
+    tie_button_state = gr.update(interactive=True) if tie_count < 3 else gr.update(interactive=False, value="Max ties reached. Please vote!")  # Third tie disables and relabels the Tie button
+    return (  # Order matches the tie_btn.click outputs list: left_output, right_output, prompt_input, tie_btn, previous_prompt, tie_count
+        gr.update(value=left_chat),
+        gr.update(value=right_chat),
+        gr.update(value=""),  # Clear the prompt input
+        tie_button_state,
+        prompt,  # Stored as previous_prompt for the next duplicate check
+        tie_count
+    )
 # Initialize Gradio Blocks
 with gr.Blocks(css="""
     #dice-button {
         with gr.Row():
             left_vote_btn = gr.Button(f"Vote for {left_output.label}", interactive=False)
+            tie_btn = gr.Button("Tie 🙈 Continue with a new prompt", interactive=False, visible=False)
             right_vote_btn = gr.Button(f"Vote for {right_output.label}", interactive=False)
         result = gr.Textbox(label="Result", interactive=False, visible=False)
             left_model = gr.Textbox(label="🔵 Left Model", interactive=False)
             right_model = gr.Textbox(label="🔴 Right Model", interactive=False)
+        previous_prompt = gr.State("")  # Add this line to store the previous prompt
+        tie_count = gr.State(0)  # Add this line to keep track of tie count
         new_battle_btn = gr.Button("New Battle")
     # Leaderboard Tab
         battle_arena,
         inputs=prompt_input,
         outputs=[left_output, right_output, left_model, right_model,
+                 left_output, right_output, left_vote_btn, right_vote_btn,
+                 tie_btn, previous_prompt, tie_count]
     )
     left_vote_btn.click(
         lambda *args: record_vote(*args, "Left is better"),
         inputs=[prompt_input, left_output, right_output, left_model, right_model],
         outputs=[result, leaderboard, left_vote_btn,
+                 right_vote_btn, tie_btn, model_names_row, leaderboard_chart]
     )
     right_vote_btn.click(
         lambda *args: record_vote(*args, "Right is better"),
         inputs=[prompt_input, left_output, right_output, left_model, right_model],
         outputs=[result, leaderboard, left_vote_btn,
+                 right_vote_btn, tie_btn, model_names_row, leaderboard_chart]
+    )
+    tie_btn.click(
+        continue_conversation,
+        inputs=[prompt_input, left_output, right_output, left_model, right_model, previous_prompt, tie_count],
+        outputs=[left_output, right_output, prompt_input, tie_btn, previous_prompt, tie_count]
     )
     new_battle_btn.click(
         new_battle,
         outputs=[prompt_input, left_output, right_output, left_model,
+                right_model, left_vote_btn, right_vote_btn, tie_btn,
+                result, leaderboard, model_names_row, leaderboard_chart, tie_count]
     )
     # Update leaderboard and chart on launch