Spaces:

SWE-Arena
/

SWE-Model-Arena

Running

App Files Community

zhiminy committed on Dec 8, 2024

Commit

9b3a3bd

1 Parent(s): bedcfff

add more models

Browse files

Files changed (3) hide show

.gitignore +1 -0
app.py +18 -26
context_window.json +31 -21

.gitignore CHANGED Viewed

@@ -1,3 +1,4 @@
 *.env
 *.venv
 *.pem

 *.env
 *.venv
 *.pem
+*.ipynb

app.py CHANGED Viewed

@@ -6,36 +6,25 @@ import os
 import random
 import threading
-import aisuite as ai
 import gradio as gr
 import pandas as pd
 from huggingface_hub import upload_file, hf_hub_download, HfFolder, HfApi
 from datetime import datetime
 from gradio_leaderboard import Leaderboard
 # Load environment variables
 dotenv.load_dotenv()
-# Retrieve the secret from the environment
-gcp_credentials = os.environ.get("GCP_CREDENTIALS")
-# Write it to a file
-credentials_path = (
-    "/tmp/gcp_credentials.json"  # Ensure this path is secure and temporary
-)
-with open(credentials_path, "w") as f:
-    f.write(gcp_credentials)
-# Set the environment variable for GCP SDKs
-os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = credentials_path
-# Timeout in seconds for model response
 TIMEOUT = 60
-# Initialize AISuite Client
-client = ai.Client()
 # Hint string constant
 SHOW_HINT_STRING = True  # Set to False to hide the hint string altogether
 HINT_STRING = "Once signed in, your votes will be recorded securely."
@@ -75,7 +64,9 @@ def truncate_prompt(user_input, model_alias, models, conversation_state):
     # Get the full conversation history for the model
     history = conversation_state.get(model_name, [])
-    full_conversation = [{"role": msg["role"], "content": msg["content"]} for msg in history]
     full_conversation.append({"role": "user", "content": user_input})
     # Convert to JSON string for accurate length measurement
@@ -100,7 +91,9 @@ def chat_with_models(
     user_input, model_alias, models, conversation_state, timeout=TIMEOUT
 ):
     model_name = models[model_alias]
-    truncated_input = truncate_prompt(user_input, model_alias, models, conversation_state)
     conversation_state.setdefault(model_name, []).append(
         {"role": "user", "content": user_input}
     )
@@ -110,10 +103,12 @@ def chat_with_models(
     def request_model_response():
         try:
-            response = client.chat.completions.create(
-                model=model_name,
-                messages=truncated_input,
-            )
             model_response["content"] = response.choices[0].message.content
         except Exception as e:
             model_response["error"] = f"{model_name} model is not available. Error: {e}"
@@ -128,15 +123,12 @@ def chat_with_models(
     response_event_occurred = response_event.wait(timeout)
     if not response_event_occurred:
-        # Timeout occurred, raise a TimeoutError to be handled in the Gradio interface
         raise TimeoutError(
             f"The {model_alias} model did not respond within {timeout} seconds."
         )
     elif model_response["error"]:
-        # An error occurred during model response
         raise Exception(model_response["error"])
     else:
-        # Successful response
         formatted_response = f"```\n{model_response['content']}\n```"
         conversation_state[model_name].append(
             {"role": "assistant", "content": model_response["content"]}

 import random
 import threading
 import gradio as gr
 import pandas as pd
 from huggingface_hub import upload_file, hf_hub_download, HfFolder, HfApi
 from datetime import datetime
 from gradio_leaderboard import Leaderboard
+from openai import OpenAI
 # Load environment variables
 dotenv.load_dotenv()
+# Initialize OpenAI Client
+api_key = os.getenv("API_KEY")
+base_url = "https://api.pandalla.ai/v1"
+openai_client = OpenAI(api_key=api_key, base_url=base_url)
+# Timeout in seconds for model responses
 TIMEOUT = 60
 # Hint string constant
 SHOW_HINT_STRING = True  # Set to False to hide the hint string altogether
 HINT_STRING = "Once signed in, your votes will be recorded securely."
     # Get the full conversation history for the model
     history = conversation_state.get(model_name, [])
+    full_conversation = [
+        {"role": msg["role"], "content": msg["content"]} for msg in history
+    ]
     full_conversation.append({"role": "user", "content": user_input})
     # Convert to JSON string for accurate length measurement
     user_input, model_alias, models, conversation_state, timeout=TIMEOUT
 ):
     model_name = models[model_alias]
+    truncated_input = truncate_prompt(
+        user_input, model_alias, models, conversation_state
+    )
     conversation_state.setdefault(model_name, []).append(
         {"role": "user", "content": user_input}
     )
     def request_model_response():
         try:
+            request_params = {
+                "model": model_name,
+                "messages": truncated_input,
+                "temperature": 0,
+            }
+            response = openai_client.chat.completions.create(**request_params)
             model_response["content"] = response.choices[0].message.content
         except Exception as e:
             model_response["error"] = f"{model_name} model is not available. Error: {e}"
     response_event_occurred = response_event.wait(timeout)
     if not response_event_occurred:
         raise TimeoutError(
             f"The {model_alias} model did not respond within {timeout} seconds."
         )
     elif model_response["error"]:
         raise Exception(model_response["error"])
     else:
         formatted_response = f"```\n{model_response['content']}\n```"
         conversation_state[model_name].append(
             {"role": "assistant", "content": model_response["content"]}

context_window.json CHANGED Viewed

@@ -1,23 +1,33 @@
 {
-    "anthropic:claude-3-5-sonnet-latest": 200000,
-    "anthropic:claude-3-5-haiku-latest": 200000,
-    "anthropic:claude-3-sonnet-20240229": 200000,
-    "anthropic:claude-3-haiku-20240307": 200000,
-    "anthropic:claude-3-opus-latest": 200000,
-    "google:gemini-1.5-flash": 1048576,
-    "google:gemini-1.5-pro": 2097152,
-    "groq:gemma2-9b-it": 8192,
-    "groq:gemma-7b-it": 8192,
-    "groq:llama-3.1-8b-instant": 128000,
-    "groq:llama-3.1-70b-versatile": 128000,
-    "groq:llama-3.2-1b-preview": 128000,
-    "groq:llama-3.2-3b-preview": 128000,
-    "openai:gpt-3.5-turbo": 16385,
-    "openai:gpt-4": 8192,
-    "openai:gpt-4-turbo": 128000,
-    "openai:gpt-4o": 128000,
-    "openai:chatgpt-4o-latest": 128000,
-    "openai:gpt-4o-mini": 128000,
-    "openai:o1-preview": 128000,
-    "openai:o1-mini": 128000
 }

 {
+    "gpt-3.5-turbo": 16000,
+    "gpt-3.5-turbo-16k": 16000,
+    "gpt-3.5-turbo-instruct" : 16000,
+    "gpt-4": 8192,
+    "gpt-4-32k": 32000,
+    "gpt-4-turbo": 128000,
+    "gpt-4o": 128000,
+    "gpt-4o-mini": 128000,
+    "chatgpt-4o-latest": 128000,
+    "claude-3-5-sonnet-latest" : 200000,
+    "deepseek-chat": 64000,
+    "gemini-1.5-flash-latest": 1048576,
+    "gemini-1.5-pro-latest": 2097152,
+    "Hunyuan-A52B-Instruct": 128000,
+    "llama-3-70b": 128000,
+    "llama-3.1-405b": 128000,
+    "llama-3.1-70b": 128000,
+    "llama-3.1-8b": 128000,
+    "llama-3.3-70b": 128000,
+    "llama-v3.2-3b": 128000,
+    "o1-all": 128000,
+    "o1-mini-all": 128000,
+    "o1-preview-all": 128000,
+    "Qwen2-72B-Instruct": 131072,
+    "Qwen2.5-32B-Instruct": 131072,
+    "qwen2.5-72b": 32768,
+    "Qwen2.5-72B-Instruct": 131072,
+    "Qwen2.5-72B-Instruct-128k": 131072,
+    "Qwen2.5-Coder-32B-Instruct": 131072,
+    "QwQ-32B-Preview": 32768,
+    "yi-large": 32000
 }